{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,22]],"date-time":"2026-06-22T22:07:03Z","timestamp":1782166023420,"version":"3.54.5"},"reference-count":88,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2025,4,10]],"date-time":"2025-04-10T00:00:00Z","timestamp":1744243200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,4,10]],"date-time":"2025-04-10T00:00:00Z","timestamp":1744243200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimedia Systems"],"published-print":{"date-parts":[[2025,6]]},"DOI":"10.1007\/s00530-025-01777-7","type":"journal-article","created":{"date-parts":[[2025,4,10]],"date-time":"2025-04-10T03:27:34Z","timestamp":1744255654000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":7,"title":["3D point cloud semantic segmentation based on visual guidance and feature enhancement"],"prefix":"10.1007","volume":"31","author":[{"given":"Sitong","family":"Chen","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yucheng","family":"Shu","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Lihong","family":"Qiao","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Zhengyang","family":"Wu","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jing","family":"Ling","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jiang","family":"Wu","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Weisheng","family":"Li","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2025,4,10]]},"reference":[{"key":"1777_CR1","doi-asserted-by":"crossref","unstructured":"Qi, C.R., Liu, W., Wu, C., Su, H., Guibas, L.J.: Frustum pointnets for 3d object detection from rgb-d data. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 918\u2013927 (2018)","DOI":"10.1109\/CVPR.2018.00102"},{"issue":"2","key":"1777_CR2","doi-asserted-by":"publisher","first-page":"722","DOI":"10.1109\/TITS.2020.3023541","volume":"23","author":"Y Cui","year":"2021","unstructured":"Cui, Y., Chen, R., Chu, W., Chen, L., Tian, D., Li, Y., et al.: Deep learning for image and point cloud fusion in autonomous driving: A review. IEEE Trans. Intell. Transp. Syst. 23(2), 722\u2013739 (2021)","journal-title":"IEEE Trans. Intell. Transp. Syst."},{"key":"1777_CR3","doi-asserted-by":"publisher","first-page":"2096","DOI":"10.1109\/TMM.2022.3177942","volume":"26","author":"YL Jin","year":"2022","unstructured":"Jin, Y.L., Ji, Z.Y., Zeng, D., Zhang, X.P.: VWP: An efficient DRL-based autonomous driving model. IEEE Trans. Multimed. 26, 2096\u20132108 (2022)","journal-title":"IEEE Trans. Multimed."},{"issue":"11","key":"1777_CR4","doi-asserted-by":"publisher","first-page":"19954","DOI":"10.1109\/TITS.2022.3182410","volume":"23","author":"J Chen","year":"2022","unstructured":"Chen, J., Wang, Q., Cheng, H.H., Peng, W., Xu, W.: A review of vision-based traffic semantic understanding in ITSs. IEEE Trans. Intell. Transp. Syst. 23(11), 19954\u201319979 (2022)","journal-title":"IEEE Trans. Intell. Transp. Syst."},{"issue":"8","key":"1777_CR5","doi-asserted-by":"publisher","first-page":"1283","DOI":"10.3390\/rs12081283","volume":"12","author":"W Tao","year":"2020","unstructured":"Tao, W., Hua, X., Chen, Z., Tian, P.: Fast and automatic registration of terrestrial point clouds using 2D line features. Remote Sens. 12(8), 1283 (2020)","journal-title":"Remote Sens."},{"key":"1777_CR6","doi-asserted-by":"publisher","first-page":"5410","DOI":"10.1109\/TMM.2023.3333206","volume":"26","author":"Y Hu","year":"2024","unstructured":"Hu, Y., Gao, J., Dong, J., Fan, B., Liu, H.: Exploring rich semantics for open-set action recognition. IEEE Trans. Multimed. 26, 5410\u20135421 (2024). https:\/\/doi.org\/10.1109\/TMM.2023.3333206","journal-title":"IEEE Trans. Multimed."},{"issue":"12","key":"1777_CR7","doi-asserted-by":"publisher","first-page":"15949","DOI":"10.1109\/TPAMI.2023.3311447","volume":"45","author":"J Gao","year":"2023","unstructured":"Gao, J., Chen, M., Xu, C.: Vectorized evidential learning for weakly-supervised temporal action localization. IEEE Trans. Pattern Anal. Mach. Intell. 45(12), 15949\u201315963 (2023). https:\/\/doi.org\/10.1109\/TPAMI.2023.3311447","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"1777_CR8","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2023.121306","volume":"237","author":"S Chai","year":"2024","unstructured":"Chai, S., Wang, S., Liu, C., Liu, X., Liu, T., Yang, R.: A visual measurement algorithm for vibration displacement of rotating body using semantic segmentation network. Expert Syst. Appl. 237, 121306 (2024)","journal-title":"Expert Syst. Appl."},{"key":"1777_CR9","doi-asserted-by":"publisher","DOI":"10.3389\/fenvs.2022.996513","volume":"10","author":"D Yang","year":"2022","unstructured":"Yang, D., Zhu, T., Wang, S., Wang, S., Xiong, Z.: LFRSNet: A robust light field semantic segmentation network combining contextual and geometric features. Front. Environ. Sci. 10, 996513 (2022)","journal-title":"Front. Environ. Sci."},{"key":"1777_CR10","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/TIM.2023.3341127","volume":"73","author":"D Zhao","year":"2024","unstructured":"Zhao, D., Zhou, H., Chen, P., Hu, Y., Ge, W., Dang, Y., et al.: Design of forward-looking sonar system for real-time image segmentation with light multiscale attention net. IEEE Trans. Instrum. Meas. 73, 1\u201317 (2024). https:\/\/doi.org\/10.1109\/TIM.2023.3341127","journal-title":"IEEE Trans. Instrum. Meas."},{"key":"1777_CR11","first-page":"77","volume":"2016","author":"C Qi","year":"2017","unstructured":"Qi, C., Su, H., Mo, K., Guibas, L.J.: PointNet: deep learning on point sets for 3D classification and segmentation. IEEE Conf. Comput. Vis. Pattern Recogn. 2016, 77\u201385 (2017)","journal-title":"IEEE Conf. Comput. Vis. Pattern Recogn."},{"key":"1777_CR12","unstructured":"Qi, C.R., Yi, L., Su, H., Guibas, L.J.: Pointnet++: Deep hierarchical feature learning on point sets in a metric space. Adv. Neural Inf Process Syst. 30 (2017)"},{"key":"1777_CR13","doi-asserted-by":"crossref","unstructured":"Meng, H.Y., Gao, L., Lai, Y.K., Manocha, D.: Vv-net: Voxel vae net with group convolutions for point cloud segmentation. In: Proceedings of the IEEE\/CVF international conference on computer vision. pp. 8500\u20138508 (2019)","DOI":"10.1109\/ICCV.2019.00859"},{"key":"1777_CR14","doi-asserted-by":"crossref","unstructured":"Zhou, Y., Tuzel, O.: Voxelnet: End-to-end learning for point cloud based 3d object detection. In: Proceedings of the IEEE conference on computer vision and pattern recognition. pp. 4490\u20134499 (2018)","DOI":"10.1109\/CVPR.2018.00472"},{"issue":"4","key":"1777_CR15","first-page":"1","volume":"36","author":"PS Wang","year":"2017","unstructured":"Wang, P.S., Liu, Y., Guo, Y.X., Sun, C.Y., Tong, X.: O-cnn: Octree-based convolutional neural networks for 3d shape analysis. ACM Trans. Graph. (TOG). 36(4), 1\u201311 (2017)","journal-title":"ACM Trans. Graph. (TOG)."},{"key":"1777_CR16","doi-asserted-by":"crossref","unstructured":"Klokov, R., Lempitsky, V.: Escape from cells: Deep kd-networks for the recognition of 3d point cloud models. In: Proceedings of the IEEE international conference on computer vision. pp. 863\u2013872 (2017)","DOI":"10.1109\/ICCV.2017.99"},{"issue":"7","key":"1777_CR17","doi-asserted-by":"publisher","first-page":"2403","DOI":"10.1109\/TVCG.2018.2887262","volume":"26","author":"T Shao","year":"2018","unstructured":"Shao, T., Yang, Y., Weng, Y., Hou, Q., Zhou, K.: H-CNN: Spatial hashing based CNN for 3D shape analysis. IEEE Trans. Visual Comput. Graphics 26(7), 2403\u20132416 (2018)","journal-title":"IEEE Trans. Visual Comput. Graphics"},{"key":"1777_CR18","doi-asserted-by":"crossref","unstructured":"Choy, C., Gwak, J., Savarese, S.: 4d spatio-temporal convnets: Minkowski convolutional neural networks. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition. pp. 3075\u20133084 (2019)","DOI":"10.1109\/CVPR.2019.00319"},{"key":"1777_CR19","doi-asserted-by":"crossref","unstructured":"Graham, B., Engelcke, M., Van Der\u00a0Maaten, L.: 3d semantic segmentation with submanifold sparse convolutional networks. In: Proceedings of the IEEE conference on computer vision and pattern recognition. pp. 9224\u20139232 (2018)","DOI":"10.1109\/CVPR.2018.00961"},{"key":"1777_CR20","doi-asserted-by":"crossref","unstructured":"Chen, X., Ma, H., Wan, J., Li, B., Xia, T.: Multi-view 3d object detection network for autonomous driving. In: Proceedings of the IEEE conference on Computer Vision and Pattern Recognition. pp. 1907\u20131915 (2017)","DOI":"10.1109\/CVPR.2017.691"},{"key":"1777_CR21","doi-asserted-by":"crossref","unstructured":"Dai, Z., Yang, Z., Yang, Y., Carbonell, J., Le, Q.V., Salakhutdinov, R.: Transformer-xl: attentive language models beyond a fixed-length context. arXiv preprint arXiv:1901.02860. (2019)","DOI":"10.18653\/v1\/P19-1285"},{"key":"1777_CR22","doi-asserted-by":"crossref","unstructured":"Lang, A.H., Vora, S., Caesar, H., Zhou, L., Yang, J., Beijbom, O.: Pointpillars: Fast encoders for object detection from point clouds. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition . pp. 12697\u201312705 (2019)","DOI":"10.1109\/CVPR.2019.01298"},{"key":"1777_CR23","doi-asserted-by":"crossref","unstructured":"Tatarchenko, M., Park, J., Koltun, V., Zhou, Q.Y.: Tangent convolutions for dense prediction in 3d. In: Proceedings of the IEEE conference on computer vision and pattern recognition. pp. 3887\u20133896 (2018)","DOI":"10.1109\/CVPR.2018.00409"},{"key":"1777_CR24","doi-asserted-by":"crossref","unstructured":"Huang, J., Zhang, H., Yi, L., Funkhouser, T., Nie\u00dfner, M., Guibas, L.J.: Texturenet: Consistent local parametrizations for learning from high-resolution signals on meshes. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. pp. 4440\u20134449 (2019)","DOI":"10.1109\/CVPR.2019.00457"},{"key":"1777_CR25","doi-asserted-by":"crossref","unstructured":"Lin, Y., Yan, Z., Huang, H., Du, D., Liu, L., Cui, S., et\u00a0al.: Fpconv: Learning local flattening for point convolution. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition. pp. 4293\u20134302 (2020)","DOI":"10.1109\/CVPR42600.2020.00435"},{"key":"1777_CR26","doi-asserted-by":"crossref","unstructured":"Yang, Y., Liu, S., Pan, H., Liu, Y., Tong, X.: PFCNN: Convolutional neural networks on 3D surfaces using parallel frames. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. pp. 13578\u201313587 (2020)","DOI":"10.1109\/CVPR42600.2020.01359"},{"issue":"11","key":"1777_CR27","first-page":"8338","volume":"44","author":"Q Hu","year":"2021","unstructured":"Hu, Q., Yang, B., Xie, L., Rosa, S., Guo, Y., Wang, Z., et al.: Learning semantic segmentation of large-scale point clouds with random sampling. IEEE Trans. Pattern Anal. Mach. Intell. 44(11), 8338\u20138354 (2021)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"1777_CR28","first-page":"9613","volume":"2018","author":"W Wu","year":"2019","unstructured":"Wu, W., Qi, Z., Li, F.: PointConv: deep convolutional networks on 3D point clouds. IEEE\/CVF Conf. Comput. Vis. Pattern Recogn.. 2018, 9613\u20139622 (2019)","journal-title":"IEEE\/CVF Conf. Comput. Vis. Pattern Recogn.."},{"key":"1777_CR29","unstructured":"Li, Y., Bu, R., Sun, M., Wu, W., Di, X., Chen, B.: PointCNN: convolution on X-transformed points. In: Proceedings of the 32nd International Conference on Neural Information Processing Systems. pp. 828\u2013838 (2018)"},{"key":"1777_CR30","doi-asserted-by":"crossref","unstructured":"Dovrat, O., Lang, I., Avidan, S.: Learning to sample. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. pp. 2760\u20132769 (2019)","DOI":"10.1109\/CVPR.2019.00287"},{"key":"1777_CR31","doi-asserted-by":"crossref","unstructured":"Thomas, H., Qi, C.R., Deschaud, J.E., Marcotegui, B., Goulette, F., Guibas, L.J.: Kpconv: Flexible and deformable convolution for point clouds. In: Proceedings of the IEEE\/CVF international conference on computer vision. pp. 6411\u20136420 (2019)","DOI":"10.1109\/ICCV.2019.00651"},{"key":"1777_CR32","unstructured":"Defferrard, M., Milani, M., Gusset, F., Perraudin, N.: DeepSphere: a graph-based spherical CNN. In: International Conference on Learning Representations (2019)"},{"key":"1777_CR33","doi-asserted-by":"crossref","unstructured":"Wang, L., Huang, Y., Hou, Y., Zhang, S., Shan, J.: Graph attention convolution for point cloud semantic segmentation. In: 2019 IEEE\/CVF Conference on Computer Vision and Pattern Recognition. IEEE Computer Society. pp. 10288\u201310297 (2019)","DOI":"10.1109\/CVPR.2019.01054"},{"key":"1777_CR34","doi-asserted-by":"crossref","unstructured":"Zhou, H., Feng, Y., Fang, M., Wei, M., Qin, J., Lu, T.: Adaptive Graph Convolution for Point Cloud Analysis. In: 2021 IEEE\/CVF International Conference on Computer Vision. IEEE. pp. 4945\u20134954 (2021)","DOI":"10.1109\/ICCV48922.2021.00492"},{"key":"1777_CR35","doi-asserted-by":"crossref","unstructured":"Yang, J., Zhang, Q., Ni, B., Li, L., Liu, J., Zhou, M., et\u00a0al.: Modeling Point Clouds With Self-Attention and Gumbel Subset Sampling. In: 2019 IEEE\/CVF Conference on Computer Vision and Pattern Recognition. IEEE. pp. 3318\u20133327 (2019)","DOI":"10.1109\/CVPR.2019.00344"},{"key":"1777_CR36","doi-asserted-by":"crossref","unstructured":"Zhao, H., Jiang, L., Jia, J., Torr, P.H., Koltun, V.: Point transformer. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision. pp. 16259\u201316268 (2021)","DOI":"10.1109\/ICCV48922.2021.01595"},{"key":"1777_CR37","doi-asserted-by":"crossref","unstructured":"Lai, X., Liu, J., Jiang, L., Wang, L., Zhao, H., Liu, S., et\u00a0al.: Stratified transformer for 3D point cloud segmentation. In: 35th IEEE\/CVF Conference on Computer Vision and Pattern Recognition. IEEE; 2022. pp. 8490\u20138499","DOI":"10.1109\/CVPR52688.2022.00831"},{"key":"1777_CR38","doi-asserted-by":"crossref","unstructured":"Yan, X., Zheng, C., Li, Z., Wang, S., Cui, S.: PointASNL: Robust point clouds processing using nonlocal neural networks with adaptive sampling. In: 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition. IEEE Computer Society. pp. 5588\u20135597 (2020)","DOI":"10.1109\/CVPR42600.2020.00563"},{"key":"1777_CR39","doi-asserted-by":"publisher","first-page":"187","DOI":"10.1007\/s41095-021-0229-5","volume":"7","author":"MH Guo","year":"2021","unstructured":"Guo, M.H., Cai, J.X., Liu, Z.N., Mu, T.J., Martin, R.R., Hu, S.M.: Pct: point cloud transformer. Comput. Vis. Media. 7, 187\u2013199 (2021)","journal-title":"Comput. Vis. Media."},{"key":"1777_CR40","doi-asserted-by":"crossref","unstructured":"Park, J., Lee, S., Kim, S., Xiong, Y., Kim, H.J.: Self-positioning point-based transformer for point cloud understanding. In: 2023 IEEE\/CVF Conference on Computer Vision and Pattern Recognition. IEEE. pp. 21814\u201321823 (2023)","DOI":"10.1109\/CVPR52729.2023.02089"},{"key":"1777_CR41","doi-asserted-by":"crossref","unstructured":"Armeni, I., Sener, O., Zamir, A.R., Jiang, H., Brilakis, I., Fischer, M., et\u00a0al.: 3d semantic parsing of large-scale indoor spaces. In: Proceedings of the IEEE conference on computer vision and pattern recognition. pp. 1534\u20131543 (2016)","DOI":"10.1109\/CVPR.2016.170"},{"key":"1777_CR42","unstructured":"Chen, M., Hu, Q., Yu, Z., Thomas, H., Feng, A., Hou, Y., et\u00a0al.: STPLS3D: A large-scale synthetic and real aerial photogrammetry 3D point cloud dataset; 2022. Publisher Copyright: 2022. The copyright of this document resides with its authors. It may be distributed unchanged freely in print or electronic forms.; 33rd British Machine Vision Conference Proceedings, BMVC 2022 ; Conference date: 21-11-2022 Through 24-11-2022"},{"key":"1777_CR43","unstructured":"Liu, Z., Tang, H., Lin, Y., Han, S.: Point-voxel CNN for efficient 3D deep learning. In: Wallach H, Larochelle H, Beygelzimer A, d\u2019Alch\u00e9-Buc F, Fox E, Garnett R, (eds). Advances in Neural Information Processing Systems. vol.\u00a032. Curran Associates, Inc.; 2019. Available from: https:\/\/proceedings.neurips.cc\/paper_files\/paper\/2019\/file\/5737034557ef5b8c02c0e46513b98f90-Paper.pdf"},{"key":"1777_CR44","doi-asserted-by":"crossref","unstructured":"Shi, S., Guo, C., Jiang, L., Wang, Z., Shi, J., Wang, X., et\u00a0al.: Pv-rcnn: Point-voxel feature set abstraction for 3d object detection. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition. pp. 10529\u201310538 (2020)","DOI":"10.1109\/CVPR42600.2020.01054"},{"key":"1777_CR45","doi-asserted-by":"crossref","unstructured":"Hu, Z., Bai, X., Shang, J., Zhang, R., Dong, J., Wang, X., et\u00a0al.: Vmnet: Voxel-mesh network for geodesic-aware 3d semantic segmentation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision. pp. 15488\u201315498 (2021)","DOI":"10.1109\/ICCV48922.2021.01520"},{"key":"1777_CR46","doi-asserted-by":"crossref","unstructured":"Riegler, G., Osman\u00a0Ulusoy, A., Geiger, A.: Octnet: Learning deep 3d representations at high resolutions. In: Proceedings of the IEEE conference on computer vision and pattern recognition. pp. 3577\u20133586 (2017)","DOI":"10.1109\/CVPR.2017.701"},{"key":"1777_CR47","doi-asserted-by":"crossref","unstructured":"Su, H., Maji, S., Kalogerakis, E., Learned-Miller, E.: Multi-view convolutional neural networks for 3d shape recognition. In: Proceedings of the IEEE international conference on computer vision. pp. 945\u2013953 (2015)","DOI":"10.1109\/ICCV.2015.114"},{"key":"1777_CR48","unstructured":"Li, B., Zhang, T., Xia, T.: Vehicle detection from 3d lidar using fully convolutional network. arXiv preprint arXiv:1608.07916 (2016)"},{"issue":"8","key":"1777_CR49","doi-asserted-by":"publisher","first-page":"9726","DOI":"10.1109\/TPAMI.2023.3244828","volume":"45","author":"Q Zhang","year":"2023","unstructured":"Zhang, Q., Hou, J., Qian, Y., Zeng, Y., Zhang, J., He, Y.: Flattening-net: Deep regular 2d representation for 3d point cloud analysis. IEEE Trans. Pattern Anal. Mach. Intell. 45(8), 9726\u20139742 (2023)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"12","key":"1777_CR50","doi-asserted-by":"publisher","first-page":"3100","DOI":"10.1007\/s11263-022-01682-w","volume":"130","author":"Q Zhang","year":"2022","unstructured":"Zhang, Q., Hou, J., Qian, Y., Chan, A.B., Zhang, J., He, Y.: Reggeonet: Learning regular representations for large-scale 3d point clouds. Int. J. Comput. Vision 130(12), 3100\u20133122 (2022)","journal-title":"Int. J. Comput. Vision"},{"key":"1777_CR51","doi-asserted-by":"crossref","unstructured":"Zhang, R., Guo, Z., Zhang, W., Li, K., Miao, X., Cui, B., et\u00a0al.: Pointclip: point cloud understanding by clip. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition. pp. 8552\u20138562 (2022)","DOI":"10.1109\/CVPR52688.2022.00836"},{"issue":"4","key":"1777_CR52","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3197517.3201301","volume":"37","author":"M Atzmon","year":"2018","unstructured":"Atzmon, M., Maron, H., Lipman, Y.: Point convolutional neural networks by extension operators. ACM Trans. Graph. (TOG). 37(4), 1\u201312 (2018)","journal-title":"ACM Trans. Graph. (TOG)."},{"key":"1777_CR53","doi-asserted-by":"crossref","unstructured":"Zhang, Z., Hua, B.S., Yeung, S.K.: ShellNet: Efficient point cloud convolutional neural networks using concentric shells statistics. In: 2019 IEEE\/CVF International Conference on Computer Vision pp. 1607\u20131616 (2019)","DOI":"10.1109\/ICCV.2019.00169"},{"key":"1777_CR54","doi-asserted-by":"crossref","unstructured":"Lang, I., Manor, A., Avidan, S.: Samplenet: Differentiable point cloud sampling. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. pp. 7578\u20137588 (2020)","DOI":"10.1109\/CVPR42600.2020.00760"},{"issue":"11","key":"1777_CR55","doi-asserted-by":"publisher","first-page":"6981","DOI":"10.1109\/TCSVT.2023.3270315","volume":"33","author":"Y Qian","year":"2023","unstructured":"Qian, Y., Hou, J., Zhang, Q., Zeng, Y., Kwong, S., He, Y.: Task-oriented compact representation of 3D point clouds via a matrix optimization-driven network. IEEE Trans. Circ. Syst. Video Technol. 33(11), 6981\u20136995 (2023). https:\/\/doi.org\/10.1109\/TCSVT.2023.3270315","journal-title":"IEEE Trans. Circ. Syst. Video Technol."},{"key":"1777_CR56","doi-asserted-by":"crossref","unstructured":"Mao, J., Wang, X., Li, H.: Interpolated convolutional networks for 3d point cloud understanding. In: Proceedings of the IEEE\/CVF international conference on computer vision; pp. 1578\u20131587 (2019)","DOI":"10.1109\/ICCV.2019.00166"},{"issue":"5","key":"1777_CR57","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3326362","volume":"38","author":"Y Wang","year":"2019","unstructured":"Wang, Y., Sun, Y., Liu, Z., Sarma, S.E., Bronstein, M.M., Solomon, J.M.: Dynamic graph cnn for learning on point clouds. ACM Trans. Graph. (tog). 38(5), 1\u201312 (2019)","journal-title":"ACM Trans. Graph. (tog)."},{"key":"1777_CR58","doi-asserted-by":"crossref","unstructured":"Zhao, H., Jiang, L., Fu, C.W., Jia, J.: PointWeb: enhancing local neighborhood features for point cloud processing. In: 2019 IEEE\/CVF Conference on Computer Vision and Pattern Recognition. IEEE Computer Society. pp. 5560\u20135568 (2019)","DOI":"10.1109\/CVPR.2019.00571"},{"key":"1777_CR59","unstructured":"Vaswani, A., Shazeer, N., Parmar, N., Uszkoreit, J., Jones, L., Gomez, A.N., et\u00a0al.: Attention is all you need. Adv Neural Inf Process Syst. 30, (2017)"},{"key":"1777_CR60","doi-asserted-by":"crossref","unstructured":"Park, C., Jeong, Y., Cho, M., Park, J.: Fast point transformer. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. pp. 16949\u201316958 (2022)","DOI":"10.1109\/CVPR52688.2022.01644"},{"key":"1777_CR61","first-page":"33330","volume":"35","author":"X Wu","year":"2022","unstructured":"Wu, X., Lao, Y., Jiang, L., Liu, X., Zhao, H.: Point transformer v2: grouped vector attention and partition-based pooling. Adv. Neural. Inf. Process. Syst. 35, 33330\u201333342 (2022)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"1777_CR62","doi-asserted-by":"crossref","unstructured":"Wu, X., Jiang, L., Wang, P.S., Liu, Z., Liu, X., Qiao, Y., et\u00a0al.: Point transformer V3: simpler faster stronger. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. pp. 4840\u20134851 (2024)","DOI":"10.1109\/CVPR52733.2024.00463"},{"issue":"5","key":"1777_CR63","doi-asserted-by":"publisher","first-page":"5456","DOI":"10.1109\/TITS.2023.3243643","volume":"24","author":"M Ibrahim","year":"2023","unstructured":"Ibrahim, M., Akhtar, N., Anwar, S., Mian, A.: SAT3D: Slot attention transformer for 3D point cloud semantic segmentation. IEEE Trans. Intell. Transp. Syst. 24(5), 5456\u20135466 (2023)","journal-title":"IEEE Trans. Intell. Transp. Syst."},{"issue":"9","key":"1777_CR64","doi-asserted-by":"publisher","first-page":"15824","DOI":"10.1109\/TITS.2022.3145588","volume":"23","author":"K Peng","year":"2022","unstructured":"Peng, K., Fei, J., Yang, K., Roitberg, A., Zhang, J., Bieder, F., et al.: MASS: Multi-attentional semantic segmentation of LiDAR data for dense top-view understanding. IEEE Trans. Intell. Transp. Syst. 23(9), 15824\u201315840 (2022)","journal-title":"IEEE Trans. Intell. Transp. Syst."},{"issue":"11","key":"1777_CR65","doi-asserted-by":"publisher","first-page":"1231","DOI":"10.1177\/0278364913491297","volume":"32","author":"A Geiger","year":"2013","unstructured":"Geiger, A., Lenz, P., Stiller, C., Urtasun, R.: Vision meets robotics: the KITTI dataset. Int. J. Rob. Res. 32(11), 1231\u20131237 (2013). https:\/\/doi.org\/10.1177\/0278364913491297","journal-title":"Int. J. Rob. Res."},{"key":"1777_CR66","doi-asserted-by":"crossref","unstructured":"Chen, D.Z., Chang, A.X., Nie\u00dfner, M.: Scanrefer: 3d object localization in rgb-d scans using natural language. In: European conference on computer vision. Springer; pp. 202\u2013221 (2020)","DOI":"10.1007\/978-3-030-58565-5_13"},{"key":"1777_CR67","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/TGRS.2024.3413677","volume":"62","author":"J Liu","year":"2024","unstructured":"Liu, J., Li, S., Dian, R., Song, Z., Kang, X.: MDENet: Multidomain differential excavating network for remote sensing image change detection. IEEE Trans. Geosci. Remote Sens. 62, 1\u201311 (2024). https:\/\/doi.org\/10.1109\/TGRS.2024.3413677","journal-title":"IEEE Trans. Geosci. Remote Sens."},{"key":"1777_CR68","doi-asserted-by":"publisher","first-page":"205","DOI":"10.1016\/j.inffus.2022.09.030","volume":"91","author":"J Liu","year":"2023","unstructured":"Liu, J., Dian, R., Li, S., Liu, H.: SGFusion: a saliency guided deep-learning framework for pixel-level image fusion. Inf. Fusion. 91, 205\u2013214 (2023). https:\/\/doi.org\/10.1016\/j.inffus.2022.09.030","journal-title":"Inf. Fusion."},{"key":"1777_CR69","doi-asserted-by":"crossref","unstructured":"Afham, M., Dissanayake, I., Dissanayake, D., Dharmasiri, A., Thilakarathna, K., Rodrigo, R.: Crosspoint: Self-supervised cross-modal contrastive learning for 3d point cloud understanding. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition; pp. 9902\u20139912 (2022)","DOI":"10.1109\/CVPR52688.2022.00967"},{"issue":"10","key":"1777_CR70","doi-asserted-by":"publisher","first-page":"6900","DOI":"10.1109\/TVCG.2023.3345353","volume":"30","author":"Q Zhang","year":"2024","unstructured":"Zhang, Q., Hou, J.: PointVST: Self-supervised pre-training for 3D point clouds via view-specific point-to-image translation. IEEE Trans. Visual Comput. Graphics 30(10), 6900\u20136912 (2024). https:\/\/doi.org\/10.1109\/TVCG.2023.3345353","journal-title":"IEEE Trans. Visual Comput. Graphics"},{"key":"1777_CR71","doi-asserted-by":"publisher","unstructured":"Zhang, Q., Hou, J., Qian, Y.: PointMCD: boosting deep point cloud encoders via multi-view cross-modal distillation for 3D shape recognition. IEEE Transactions on Multimedia. pp. 1\u201314. (2023) https:\/\/doi.org\/10.1109\/TMM.2023.3286981","DOI":"10.1109\/TMM.2023.3286981"},{"key":"1777_CR72","doi-asserted-by":"crossref","unstructured":"Tang, P., Xu, H.M., Ma, C.: ProtoTransfer: cross-modal prototype transfer for point cloud segmentation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 3337\u20133347 (2023)","DOI":"10.1109\/ICCV51070.2023.00309"},{"key":"1777_CR73","doi-asserted-by":"crossref","unstructured":"Xu, M., Zhou, Z., Zhang, J., Qiao, Y.: Investigate indistinguishable points in semantic segmentation of 3d point cloud. In: Proceedings of the AAAI Conference on Artificial Intelligence. vol.\u00a035, pp. 3047\u20133055 (2021)","DOI":"10.1609\/aaai.v35i4.16413"},{"key":"1777_CR74","doi-asserted-by":"crossref","unstructured":"Hu, Z., Zhen, M., Bai, X., Fu, H., Tai, C.l.: Jsenet: Joint semantic segmentation and edge detection network for 3d point clouds. In: Computer Vision\u2013ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part XX 16. Springer; pp. 222\u2013239 (2020)","DOI":"10.1007\/978-3-030-58565-5_14"},{"key":"1777_CR75","doi-asserted-by":"crossref","unstructured":"Du, S., Ibrahimli, N., Stoter, J., Kooij, J., Nan, L.: Push-the-boundary: boundary-aware feature propagation for semantic segmentation of 3D point clouds. In: 2022 International Conference on 3D Vision; pp. 1\u201310 (2022)","DOI":"10.1109\/3DV57658.2022.00025"},{"key":"1777_CR76","doi-asserted-by":"crossref","unstructured":"Lan, S., Yu, R., Yu, G., Davis, L.S.: Modeling local geometric structure of 3D point clouds using Geo-CNN. In: 2019 IEEE\/CVF Conference on Computer Vision and Pattern Recognition. IEEE Computer Society; 2019. pp. 998\u20131008","DOI":"10.1109\/CVPR.2019.00109"},{"key":"1777_CR77","unstructured":"Blanco, J.L., Rai, P.K.: nanoflann: a C++ header-only fork of FLANN, a library for Nearest Neighbor (NN) with KD-trees. https:\/\/github.com\/jlblancoc\/nanoflann"},{"key":"1777_CR78","doi-asserted-by":"crossref","unstructured":"Tang, L., Zhan, Y., Chen, Z., Yu, B., Tao, D.: Contrastive boundary learning for point cloud segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. pp. 8489\u20138499 (2022)","DOI":"10.1109\/CVPR52688.2022.00830"},{"key":"1777_CR79","first-page":"23192","volume":"35","author":"G Qian","year":"2022","unstructured":"Qian, G., Li, Y., Peng, H., Mai, J., Hammoud, H., Elhoseiny, M., et al.: Pointnext: Revisiting pointnet++ with improved training and scaling strategies. Adv. Neural. Inf. Process. Syst. 35, 23192\u201323204 (2022)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"1777_CR80","doi-asserted-by":"crossref","unstructured":"Lin, H., Zheng, X., Li, L., Chao, F., Wang, S., Wang, Y., et\u00a0al.: Meta architecture for point cloud analysis. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition; pp. 17682\u201317691 (2023)","DOI":"10.1109\/CVPR52729.2023.01696"},{"key":"1777_CR81","doi-asserted-by":"crossref","unstructured":"Ye, X., Li, J., Huang, H., Du, L., Zhang, X.: 3D recurrent neural networks with context fusion for point cloud semantic segmentation. In: European Conference on Computer Vision; pp. 415\u2013430 (2018)","DOI":"10.1007\/978-3-030-01234-2_25"},{"key":"1777_CR82","doi-asserted-by":"crossref","unstructured":"Huang, Q., Wang, W., Neumann, U.: Recurrent slice networks for 3D segmentation of point clouds. In: 2018 IEEE\/CVF Conference on Computer Vision and Pattern Recognition. IEEE. pp. 2626\u20132635 (2018)","DOI":"10.1109\/CVPR.2018.00278"},{"key":"1777_CR83","doi-asserted-by":"crossref","unstructured":"Landrieu, L., Simonovsky, M.: Large-scale point cloud semantic segmentation with superpoint graphs. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. pp. 4558\u20134567 (2018)","DOI":"10.1109\/CVPR.2018.00479"},{"key":"1777_CR84","doi-asserted-by":"crossref","unstructured":"Jiang, L., Zhao, H., Liu, S., Shen, X., Fu, C.W., Jia, J.: Hierarchical point-edge interaction network for point cloud semantic segmentation. In: 2019 IEEE\/CVF International Conference on Computer Vision. IEEE Computer Society; pp. 10432\u201310440 (2019)","DOI":"10.1109\/ICCV.2019.01053"},{"key":"1777_CR85","doi-asserted-by":"crossref","unstructured":"Fan, S., Dong, Q., Zhu, F., Lv, Y., Ye, P., Wang, F.Y.: SCF-Net: learning spatial contextual features for large-scale point cloud segmentation. In: 2021 IEEE\/CVF Conference on Computer Vision and Pattern Recognition. IEEE. p. 14499\u201314508 (2021)","DOI":"10.1109\/CVPR46437.2021.01427"},{"key":"1777_CR86","doi-asserted-by":"crossref","unstructured":"Chen, C., Wang, Y., Chen, H., Yan, X., Ren, D., Guo, Y., et\u00a0al.: GeoSegNet: Point Cloud Semantic Segmentation Via Geometric Encoder\u2013Decoder Modeling. The Visual Computer. pp. 1\u201315 (2023)","DOI":"10.1007\/s00371-023-02853-7"},{"key":"1777_CR87","doi-asserted-by":"crossref","unstructured":"Qiu, S., Anwar, S., Barnes, N.: Semantic segmentation for real point cloud scenes via bilateral augmentation and adaptive fusion. In: 2021 IEEE\/CVF Conference on Computer Vision and Pattern Recognition. IEEE Computer Society, pp. 1757\u20131767 (2021)","DOI":"10.1109\/CVPR46437.2021.00180"},{"key":"1777_CR88","unstructured":"Mao, Y., Sun, X., Chen, K., Diao, W., Guo, Z., Lu, X., et\u00a0al.: Semantic segmentation for point cloud scenes via dilated graph feature aggregation and pyramid decoders. arXiv preprint arXiv:2204.04944. (2022)"}],"container-title":["Multimedia Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00530-025-01777-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00530-025-01777-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00530-025-01777-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,4]],"date-time":"2025-09-04T15:03:51Z","timestamp":1756998231000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00530-025-01777-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,4,10]]},"references-count":88,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2025,6]]}},"alternative-id":["1777"],"URL":"https:\/\/doi.org\/10.1007\/s00530-025-01777-7","relation":{},"ISSN":["0942-4962","1432-1882"],"issn-type":[{"value":"0942-4962","type":"print"},{"value":"1432-1882","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,4,10]]},"assertion":[{"value":"4 June 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"21 March 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"10 April 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"187"}}