{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,2]],"date-time":"2026-04-02T12:12:43Z","timestamp":1775131963277,"version":"3.50.1"},"reference-count":47,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2026,2,3]],"date-time":"2026-02-03T00:00:00Z","timestamp":1770076800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,2,3]],"date-time":"2026-02-03T00:00:00Z","timestamp":1770076800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"name":"Key Research and Development Program of Shaanxi Province","award":["2024SF-YBXM-681"],"award-info":[{"award-number":["2024SF-YBXM-681"]}]},{"DOI":"10.13039\/501100012166","name":"National Key R&D Program of China","doi-asserted-by":"crossref","award":["2024YFF0907604"],"award-info":[{"award-number":["2024YFF0907604"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"crossref","award":["62572394"],"award-info":[{"award-number":["62572394"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"crossref"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimedia Systems"],"published-print":{"date-parts":[[2026,4]]},"DOI":"10.1007\/s00530-025-02165-x","type":"journal-article","created":{"date-parts":[[2026,2,3]],"date-time":"2026-02-03T03:44:44Z","timestamp":1770090284000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Attention-guided multi-scale local reconstruction for point clouds via masked autoencoder self-supervised learning"],"prefix":"10.1007","volume":"32","author":[{"given":"Xin","family":"Cao","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Haoyu","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jiaxu","family":"Shi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Linzhi","family":"Su","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xinda","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kang","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2026,2,3]]},"reference":[{"key":"2165_CR1","unstructured":"Qi, C.R., Su, H., Mo, K., Guibas, L.J.: Pointnet: Deep learning on point sets for 3d classification and segmentation, in Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 652\u2013660. (2017)"},{"issue":"9","key":"2165_CR2","doi-asserted-by":"publisher","first-page":"11321","DOI":"10.1109\/TPAMI.2023.3262786","volume":"45","author":"A Xiao","year":"2023","unstructured":"Xiao, A., Huang, J., Guan, D., Zhang, X., Lu, S., Shao, L.: Unsupervised point cloud representation learning with deep neural networks: A survey. IEEE Trans. Pattern Anal. Mach. Intell. 45(9), 11321\u201311339 (2023)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"1","key":"2165_CR3","first-page":"857","volume":"35","author":"X Liu","year":"2021","unstructured":"Liu, X., et al.: Self-supervised learning: Generative or contrastive. IEEE Trans. Knowl. Data Eng. 35(1), 857\u2013876 (2021)","journal-title":"IEEE Trans. Knowl. Data Eng."},{"issue":"1","key":"2165_CR4","doi-asserted-by":"publisher","first-page":"53","DOI":"10.1109\/MSP.2017.2765202","volume":"35","author":"A Creswell","year":"2018","unstructured":"Creswell, A., White, T., Dumoulin, V., Arulkumaran, K., Sengupta, B., Bharath, A.A.: Generative adversarial networks: An overview. IEEE. Signal. Process. Mag. 35(1), 53\u201365 (2018)","journal-title":"IEEE. Signal. Process. Mag."},{"key":"2165_CR5","unstructured":"Kingma, D.P.: Auto-encoding variational bayes, arXiv preprint arXiv:1312.6114, (2013)"},{"key":"2165_CR6","doi-asserted-by":"crossref","unstructured":"Ye, M., Zhang, X., Yuen, P.C., Chang, S.-F.: Unsupervised embedding learning via invariant and spreading instance feature, in Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 6210\u20136219. (2019)","DOI":"10.1109\/CVPR.2019.00637"},{"key":"2165_CR7","doi-asserted-by":"crossref","unstructured":"Poursaeed, O., Jiang, T., Qiao, H., Xu, N., Kim, V.G.: Self-supervised learning of point clouds via orientation estimation, in 2020 International Conference on 3D Vision (3DV), : IEEE, pp. 1018\u20131028. (2020)","DOI":"10.1109\/3DV50981.2020.00112"},{"key":"2165_CR8","doi-asserted-by":"crossref","unstructured":"Li, R., Li, X., Fu, C.-W., Cohen-Or, D., Heng, P.-A.: Pu-gan: a point cloud upsampling adversarial network, in Proceedings of the IEEE\/CVF international conference on computer vision, pp. 7203\u20137212. (2019)","DOI":"10.1109\/ICCV.2019.00730"},{"key":"2165_CR9","doi-asserted-by":"crossref","unstructured":"Park, J.H., Kim, J.H., Ngo, B.H., Cho, S.I.: Adversarial representation teaching with perturbation-agnostic student-teacher structure for semi-supervised learning. Available SSRN 4246745, (2023)","DOI":"10.2139\/ssrn.4246745"},{"key":"2165_CR10","doi-asserted-by":"crossref","unstructured":"Ngo, B.H., Choi, T.J.: Cross-domain knowledge distillation for domain adaptation with GCN-driven MLP generalization. Appl. Soft Comput., p. 113771, (2025)","DOI":"10.1016\/j.asoc.2025.113771"},{"key":"2165_CR11","doi-asserted-by":"crossref","unstructured":"Wang, S., Ren, W., Gao, P., Yu, J., Liu, J.: ZRID-Net: Zero-Reference Real-World Image Dehazing Framework Via Deep Self-Decoupling and Reverse Knowledge Transfer. IEEE Transactions on Circuits and Systems for Video Technology (2025)","DOI":"10.1109\/TCSVT.2025.3609735"},{"issue":"3","key":"2165_CR12","doi-asserted-by":"publisher","first-page":"1921","DOI":"10.1007\/s00371-024-03511-2","volume":"41","author":"S Wang","year":"2025","unstructured":"Wang, S., Hou, Q., Li, J., Liu, J.: TSID-Net: A two-stage single image dehazing framework with style transfer and contrastive knowledge transfer. Visual Comput. 41(3), 1921\u20131938 (2025)","journal-title":"Visual Comput."},{"key":"2165_CR13","doi-asserted-by":"publisher","first-page":"111997","DOI":"10.1016\/j.engappai.2025.111997","volume":"160","author":"J Wang","year":"2025","unstructured":"Wang, J., Wang, S., Pang, Y., Liu, J.: PromptDNet: A weakly supervised prompt framework for single image dehazing via dual-level depth cues. Eng. Appl. Artif. Intell. 160, 111997 (2025)","journal-title":"Eng. Appl. Artif. Intell."},{"key":"2165_CR14","doi-asserted-by":"crossref","unstructured":"Ngo, B.H., Choi, T.J., Cho, S.I.: Towards Enhancing Prototypes Driven by Graph Convolutional Networkfor Domain Adaptation, Expert Systems with Applications, p. 130010, (2025)","DOI":"10.1016\/j.eswa.2025.130010"},{"key":"2165_CR15","unstructured":"Sauder, J., Sievers, B.: Self-supervised deep learning on point clouds by reconstructing space. Adv. Neural. Inf. Process. Syst., 32, (2019)"},{"key":"2165_CR16","doi-asserted-by":"crossref","unstructured":"Wang, H., Tang, Y., Wang, Y., Guo, J., Deng, Z.-H., Han, K.: Masked image modeling with local multi-scale reconstruction, in Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 2122\u20132131. (2023)","DOI":"10.1109\/CVPR52729.2023.00211"},{"key":"2165_CR17","doi-asserted-by":"crossref","unstructured":"Chen, H.-W., Xu, Y.-S., Hong, M.-F., Tsai, Y.-M., Kuo, H.-K., Lee, C.-Y.: Cascaded local implicit transformer for arbitrary-scale super-resolution, in Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 18257\u201318267. (2023)","DOI":"10.1109\/CVPR52729.2023.01751"},{"key":"2165_CR18","doi-asserted-by":"crossref","unstructured":"Liu, J., Pang, Y., Wang, S.: DCE-Net: a dual-frequency domain knowledge-guided framework for image dehazing via detail and content enhancements. IEEE. Signal. Process. Lett., (2025)","DOI":"10.1109\/LSP.2025.3551201"},{"key":"2165_CR19","unstructured":"Chang, A.X., et al.: Shapenet: An information-rich 3d model repository, arXiv preprint arXiv:1512.03012, (2015)"},{"key":"2165_CR20","doi-asserted-by":"crossref","unstructured":"He, K., Chen, X., Xie, S., Li, Y., Doll\u00e1r, P., Girshick, R.: Masked autoencoders are scalable vision learners, in Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 16000\u201316009. (2022)","DOI":"10.1109\/CVPR52688.2022.01553"},{"key":"2165_CR21","unstructured":"Kenton, J.D.M.-W.C., Toutanova, L.K.: Bert: Pre-training of deep bidirectional transformers for language understanding, in Proceedings of naacL-HLT, vol. 1: Minneapolis, Minnesota, p. 2. (2019)"},{"key":"2165_CR22","doi-asserted-by":"crossref","unstructured":"Xie, Z., et al.: Simmim: A simple framework for masked image modeling, in Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 9653\u20139663. (2022)","DOI":"10.1109\/CVPR52688.2022.00943"},{"key":"2165_CR23","doi-asserted-by":"crossref","unstructured":"Yu, X., Tang, L., Rao, Y., Huang, T., Zhou, J., Lu, J.: Point-bert: Pre-training 3d point cloud transformers with masked point modeling, in Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 19313\u201319322. (2022)","DOI":"10.1109\/CVPR52688.2022.01871"},{"key":"2165_CR24","doi-asserted-by":"crossref","unstructured":"Pang, Y., Wang, W., Tay, F.E., Liu, W., Tian, Y., Yuan, L.: Masked autoencoders for point cloud self-supervised learning, in European conference on computer vision, : Springer, pp. 604\u2013621. (2022)","DOI":"10.1007\/978-3-031-20086-1_35"},{"key":"2165_CR25","doi-asserted-by":"crossref","unstructured":"Li, H., et al.: Mask-Point: automatic 3D surface defects detection network for fiber-reinforced resin matrix composites, Polymers, vol. 14, no. 16, p. 3390, (2022)","DOI":"10.3390\/polym14163390"},{"key":"2165_CR26","first-page":"1","volume":"61","author":"Y Liu","year":"2023","unstructured":"Liu, Y., Yan, X., Li, Z., Chen, Z., Wei, Z., Wei, M.: PointGame: Geometrically and adaptively masked autoencoder on point clouds. IEEE Trans. Geosci. Remote Sens. 61, 1\u201312 (2023)","journal-title":"IEEE Trans. Geosci. Remote Sens."},{"key":"2165_CR27","unstructured":"Zhang, X., Zhang, S., Yan, J.: PCP-MAE: Learning to Predict Centers for Point Masked Autoencoders, arXiv preprint arXiv:2408.08753, (2024)"},{"key":"2165_CR28","doi-asserted-by":"crossref","unstructured":"Lang, A.H., Vora, S., Caesar, H., Zhou, L., Yang, J., Beijbom, O.: Pointpillars: Fast encoders for object detection from point clouds, in Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 12697\u201312705. (2019)","DOI":"10.1109\/CVPR.2019.01298"},{"key":"2165_CR29","doi-asserted-by":"crossref","unstructured":"Maturana, D., Scherer, S., Voxnet: A 3d convolutional neural network for real-time object recognition, in 2015 IEEE\/RSJ international conference on intelligent robots and systems (IROS), : IEEE, pp. 922\u2013928. (2015)","DOI":"10.1109\/IROS.2015.7353481"},{"key":"2165_CR30","unstructured":"Qi, C.R., Yi, L., Su, H., Guibas, L.J.: Pointnet++: Deep hierarchical feature learning on point sets in a metric space, Advances in neural information processing systems, vol. 30, (2017)"},{"issue":"5","key":"2165_CR31","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3326362","volume":"38","author":"Y Wang","year":"2019","unstructured":"Wang, Y., Sun, Y., Liu, Z., Sarma, S.E., Bronstein, M.M., Solomon, J.M.: Dynamic graph Cnn for learning on point clouds. ACM Trans. Graphics (tog). 38(5), 1\u201312 (2019)","journal-title":"ACM Trans. Graphics (tog)"},{"key":"2165_CR32","unstructured":"Vaswani, A.: Attention is all you need. Adv. Neural. Inf. Process. Syst., (2017)"},{"key":"2165_CR33","doi-asserted-by":"crossref","unstructured":"Zhao, H., Jiang, L., Jia, J., Torr, P.H., Koltun, V.: Point transformer, in Proceedings of the IEEE\/CVF international conference on computer vision, pp. 16259\u201316268. (2021)","DOI":"10.1109\/ICCV48922.2021.01595"},{"key":"2165_CR34","doi-asserted-by":"publisher","first-page":"111578","DOI":"10.1016\/j.patcog.2025.111578","volume":"164","author":"G Xiao","year":"2025","unstructured":"Xiao, G., Ge, S., Zhong, Y., Xiao, Z., Song, J., Lu, J.: SAPFormer: Shape-aware propagation transformer for point clouds. Pattern Recogn. 164, 111578 (2025)","journal-title":"Pattern Recogn."},{"key":"2165_CR35","doi-asserted-by":"publisher","first-page":"111361","DOI":"10.1016\/j.patcog.2025.111361","volume":"162","author":"S Guo","year":"2025","unstructured":"Guo, S., Cai, J., Hu, Y., Liu, Q., Xu, M.: LCASAFormer: Cross-attention enhanced backbone network for 3D point cloud tasks. Pattern Recogn. 162, 111361 (2025)","journal-title":"Pattern Recogn."},{"key":"2165_CR36","doi-asserted-by":"crossref","unstructured":"Afham, M., Dissanayake, I., Dissanayake, D., Dharmasiri, A., Thilakarathna, K., Rodrigo, R.: Crosspoint: Self-supervised cross-modal contrastive learning for 3d point cloud understanding, in Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 9902\u20139912. (2022)","DOI":"10.1109\/CVPR52688.2022.00967"},{"key":"2165_CR37","doi-asserted-by":"crossref","unstructured":"Huang, S., Xie, Y., Zhu, S.-C., Zhu, Y.: Spatio-temporal self-supervised representation learning for 3d point clouds, in Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 6535\u20136545. (2021)","DOI":"10.1109\/ICCV48922.2021.00647"},{"key":"2165_CR38","doi-asserted-by":"crossref","unstructured":"Wang, H., Liu, Q., Yue, X., Lasenby, J., Kusner, M.J.: Unsupervised point cloud pre-training via occlusion completion, in Proceedings of the IEEE\/CVF international conference on computer vision, pp. 9782\u20139792. (2021)","DOI":"10.1109\/ICCV48922.2021.00964"},{"key":"2165_CR39","first-page":"27061","volume":"35","author":"R Zhang","year":"2022","unstructured":"Zhang, R., et al.: Point-m2ae: multi-scale masked autoencoders for hierarchical point cloud pre-training. Adv. Neural. Inf. Process. Syst. 35, 27061\u201327074 (2022)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"2165_CR40","doi-asserted-by":"crossref","unstructured":"Wu, Z., et al.: 3d shapenets: A deep representation for volumetric shapes, in Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 1912\u20131920. (2015)","DOI":"10.1109\/CVPR.2015.7298801"},{"key":"2165_CR41","doi-asserted-by":"crossref","unstructured":"Uy, M.A., Pham, Q.-H., Hua, B.-S., Nguyen, T., Yeung, S.-K.: Revisiting point cloud classification: A new benchmark dataset and classification model on real-world data, in Proceedings of the IEEE\/CVF international conference on computer vision, pp. 1588\u20131597. (2019)","DOI":"10.1109\/ICCV.2019.00167"},{"key":"2165_CR42","doi-asserted-by":"crossref","unstructured":"Armeni, I., et al.: 3d semantic parsing of large-scale indoor spaces, in Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 1534\u20131543. (2016)","DOI":"10.1109\/CVPR.2016.170"},{"key":"2165_CR43","unstructured":"Li, Y., Bu, R., Sun, M., Wu, W., Di, X., Chen, B.: Pointcnn: Convolution on x-transformed points, Advances in neural information processing systems, vol. 31, (2018)"},{"key":"2165_CR44","doi-asserted-by":"crossref","unstructured":"Liu, Y., Fan, B., Xiang, S., Pan, C.: Relation-shape convolutional neural network for point cloud analysis, in Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 8895\u20138904. (2019)","DOI":"10.1109\/CVPR.2019.00910"},{"key":"2165_CR45","doi-asserted-by":"publisher","first-page":"187","DOI":"10.1007\/s41095-021-0229-5","volume":"7","author":"M-H Guo","year":"2021","unstructured":"Guo, M.-H., Cai, J.-X., Liu, Z.-N., Mu, T.-J., Martin, R.R., Hu, S.-M.: Pct: Point cloud transformer. Comput. Visual Media. 7, 187\u2013199 (2021)","journal-title":"Comput. Visual Media"},{"key":"2165_CR46","doi-asserted-by":"crossref","unstructured":"Xu, Y., Fan, T., Xu, M., Zeng, L., Qiao, Y.: Spidercnn: Deep learning on point sets with parameterized convolutional filters, in Proceedings of the European conference on computer vision (ECCV), pp. 87\u2013102. (2018)","DOI":"10.1007\/978-3-030-01237-3_6"},{"key":"2165_CR47","doi-asserted-by":"publisher","first-page":"4436","DOI":"10.1109\/TIP.2021.3072214","volume":"30","author":"S Cheng","year":"2021","unstructured":"Cheng, S., Chen, X., He, X., Liu, Z., Bai, X.: Pra-net: Point relation-aware network for 3d point cloud analysis. IEEE Trans. Image Process. 30, 4436\u20134448 (2021)","journal-title":"IEEE Trans. Image Process."}],"container-title":["Multimedia Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00530-025-02165-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00530-025-02165-x","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00530-025-02165-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,4,2]],"date-time":"2026-04-02T11:35:14Z","timestamp":1775129714000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00530-025-02165-x"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,2,3]]},"references-count":47,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2026,4]]}},"alternative-id":["2165"],"URL":"https:\/\/doi.org\/10.1007\/s00530-025-02165-x","relation":{},"ISSN":["0942-4962","1432-1882"],"issn-type":[{"value":"0942-4962","type":"print"},{"value":"1432-1882","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,2,3]]},"assertion":[{"value":"5 October 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 December 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"3 February 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"N\/A.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical approval"}}],"article-number":"109"}}