{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,14]],"date-time":"2026-05-14T12:33:39Z","timestamp":1778762019688,"version":"3.51.4"},"reference-count":65,"publisher":"Springer Science and Business Media LLC","issue":"6","license":[{"start":{"date-parts":[[2026,4,1]],"date-time":"2026-04-01T00:00:00Z","timestamp":1775001600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,4,1]],"date-time":"2026-04-01T00:00:00Z","timestamp":1775001600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Vis Comput"],"published-print":{"date-parts":[[2026,4]]},"DOI":"10.1007\/s00371-026-04444-8","type":"journal-article","created":{"date-parts":[[2026,4,1]],"date-time":"2026-04-01T16:34:23Z","timestamp":1775061263000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Deep Learning-Based Instance Segmentation: A Comprehensive Review of Algorithms, Challenges, and Future Directions"],"prefix":"10.1007","volume":"42","author":[{"given":"Jiacheng","family":"Lou","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sergei","family":"Shavetov","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xuecheng","family":"Wen","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zhidong","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xiang","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Chunhong","family":"Yuan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2026,4,1]]},"reference":[{"key":"4444_CR1","doi-asserted-by":"crossref","unstructured":"Long, J., Shelhamer, E., Darrell, T.: Fully convolutional networks for semantic segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 3431\u20133440 (2015)","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"4444_CR2","unstructured":"Ren, S., He, K., Girshick, R., Sun, J.: Faster r-cnn: Towards real-time object detection with region proposal networks. In: Advances in Neural Information Processing Systems (2015)"},{"key":"4444_CR3","doi-asserted-by":"crossref","unstructured":"Lin, T.Y., Maire, M., Belongie, S., et al.: Microsoft coco: Common objects in context. In: Computer vision-ECCV 2014: 13th European Conference. Zurich, Switzerland, September 6\u201312, 2014, Proceedings, Part V 13, pp. 740\u2013755. Springer, Cham (2014)","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"4444_CR4","doi-asserted-by":"crossref","unstructured":"He, K., Gkioxari, G., Doll\u00e1r, P., et al.: Mask r-cnn. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 2961\u20132969 (2017)","DOI":"10.1109\/ICCV.2017.322"},{"key":"4444_CR5","doi-asserted-by":"crossref","unstructured":"Cordts, M., Omran, M., Ramos, S., et al.: The cityscapes dataset for semantic urban scene understanding. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 3213\u20133223 (2016)","DOI":"10.1109\/CVPR.2016.350"},{"key":"4444_CR6","doi-asserted-by":"crossref","unstructured":"Lin, T.Y., Doll\u00e1r, P., Girshick, R., et al.: Feature pyramid networks for object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2117\u20132125 (2017)","DOI":"10.1109\/CVPR.2017.106"},{"key":"4444_CR7","doi-asserted-by":"crossref","unstructured":"Liu, S., Qi, L., Qin, H., et al.: Path aggregation network for instance segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 8759\u20138768 (2018)","DOI":"10.1109\/CVPR.2018.00913"},{"key":"4444_CR8","doi-asserted-by":"crossref","unstructured":"Hariharan, B., Arbel\u00e1ez, P., Girshick, R., Malik, J.: Simultaneous detection and segmentation. In: European Conference on Computer Vision, pp. 297\u2013312 (2014). Springer","DOI":"10.1007\/978-3-319-10584-0_20"},{"issue":"2","key":"4444_CR9","doi-asserted-by":"publisher","first-page":"88","DOI":"10.1016\/j.patrec.2008.04.005","volume":"30","author":"GJ Brostow","year":"2009","unstructured":"Brostow, G.J., Fauqueur, J., Cipolla, R.: Semantic object classes in video: A high-definition ground truth database. Pattern Recogn. Lett. 30(2), 88\u201397 (2009)","journal-title":"Pattern Recogn. Lett."},{"key":"4444_CR10","unstructured":"Pinheiro, P.O., Collobert, R., Doll\u00e1r, P.: Learning to segment object candidates. Advances in neural information processing systems 28 (2015)"},{"key":"4444_CR11","doi-asserted-by":"publisher","first-page":"75","DOI":"10.1007\/978-3-319-46448-0_5","volume-title":"Computer Vision-ECCV 2016: 14th European Conference. Amsterdam, The Netherlands, October 11\u201314, 2016, Proceedings, Part I 14","author":"PO Pinheiro","year":"2016","unstructured":"Pinheiro, P.O., Lin, T.Y., Collobert, R., et al.: Learning to refine object segments. In: Computer Vision-ECCV 2016: 14th European Conference. Amsterdam, The Netherlands, October 11\u201314, 2016, Proceedings, Part I 14, pp. 75\u201391. Springer, Cham (2016)"},{"key":"4444_CR12","doi-asserted-by":"crossref","unstructured":"Chen, L.C., Hermans, A., Papandreou, G., et al.: Masklab: Instance segmentation by refining object detection with semantic and direction features. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4013\u20134022 (2018)","DOI":"10.1109\/CVPR.2018.00422"},{"key":"4444_CR13","doi-asserted-by":"crossref","unstructured":"Bolya, D., Zhou, C., Xiao, F., et al.: Yolact: Real-time instance segmentation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 9157\u20139166 (2019)","DOI":"10.1109\/ICCV.2019.00925"},{"key":"4444_CR14","doi-asserted-by":"publisher","first-page":"649","DOI":"10.1007\/978-3-030-58523-5_38","volume-title":"Computer Vision-ECCV 2020: 16th European Conference. Glasgow, UK, August 23\u201328, 2020, Proceedings, Part XVIII 16","author":"X Wang","year":"2020","unstructured":"Wang, X., Kong, T., Shen, C., et al.: Solo: Segmenting objects by locations. In: Computer Vision-ECCV 2020: 16th European Conference. Glasgow, UK, August 23\u201328, 2020, Proceedings, Part XVIII 16, pp. 649\u2013665. Springer, Cham (2020)"},{"key":"4444_CR15","doi-asserted-by":"crossref","unstructured":"Chen, H., Sun, K., Tian, Z., et al.: Blendmask: Top-down meets bottom-up for instance segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 8573\u20138581 (2020)","DOI":"10.1109\/CVPR42600.2020.00860"},{"key":"4444_CR16","doi-asserted-by":"crossref","unstructured":"Fang, Y., Yang, S., Wang, X., et al.: Instances as queries. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 6910\u20136919 (2021)","DOI":"10.1109\/ICCV48922.2021.00683"},{"key":"4444_CR17","doi-asserted-by":"crossref","unstructured":"Cheng, B., Misra, I., Schwing, A.G., et al.: Masked-attention mask transformer for universal image segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 1290\u20131299 (2022)","DOI":"10.1109\/CVPR52688.2022.00135"},{"key":"4444_CR18","doi-asserted-by":"crossref","unstructured":"Li, F., Zhang, H., Xu, H., et al.: Mask dino: Towards a unified transformer-based framework for object detection and segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 3041\u20133050 (2023)","DOI":"10.1109\/CVPR52729.2023.00297"},{"key":"4444_CR19","unstructured":"Bommasani, R., Hudson, D.A., Adeli, E., Altman, R., Arora, S., Arx, S., Bernstein, M.S., Bohg, J., Bosselut, A., Brunskill, E., et al.: On the opportunities and risks of foundation models. arXiv preprint arXiv:2108.07258 (2021)"},{"key":"4444_CR20","doi-asserted-by":"crossref","unstructured":"Kirillov, A., Mintun, E., Ravi, N., et al.: Segment anything. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 4015\u20134026 (2023)","DOI":"10.1109\/ICCV51070.2023.00371"},{"key":"4444_CR21","first-page":"19769","volume":"36","author":"X Zou","year":"2023","unstructured":"Zou, X., Yang, J., Zhang, H., et al.: Segment everything everywhere all at once. Adv. Neural. Inf. Process. Syst. 36, 19769\u201319782 (2023)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"4444_CR22","doi-asserted-by":"crossref","unstructured":"Gupta, A., Dollar, P., Girshick, R.: Lvis: A dataset for large vocabulary instance segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5356\u20135364 (2019)","DOI":"10.1109\/CVPR.2019.00550"},{"issue":"11","key":"4444_CR23","doi-asserted-by":"publisher","first-page":"1231","DOI":"10.1177\/0278364913491297","volume":"32","author":"A Geiger","year":"2013","unstructured":"Geiger, A., Lenz, P., Stiller, C., et al.: Vision meets robotics: The kitti dataset. The Int. J. Robot. Res. 32(11), 1231\u20131237 (2013)","journal-title":"The Int. J. Robot. Res."},{"key":"4444_CR24","doi-asserted-by":"crossref","unstructured":"Kirillov, A., Wu, Y., He, K., et al.: Pointrend: Image segmentation as rendering. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 9799\u20139808 (2020)","DOI":"10.1109\/CVPR42600.2020.00982"},{"key":"4444_CR25","doi-asserted-by":"publisher","first-page":"282","DOI":"10.1007\/978-3-030-58452-8_17","volume-title":"Computer Vision-ECCV 2020: 16th European Conference. Glasgow, UK, August 23\u201328, 2020, Proceedings, Part I 16","author":"Z Tian","year":"2020","unstructured":"Tian, Z., Shen, C., Chen, H.: Conditional convolutions for instance segmentation. In: Computer Vision-ECCV 2020: 16th European Conference. Glasgow, UK, August 23\u201328, 2020, Proceedings, Part I 16, pp. 282\u2013298. Springer, Cham (2020)"},{"issue":"1","key":"4444_CR26","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s40537-019-0197-0","volume":"6","author":"C Shorten","year":"2019","unstructured":"Shorten, C., Khoshgoftaar, T.M.: A survey on image data augmentation for deep learning. J Big Data 6(1), 1\u201348 (2019)","journal-title":"J Big Data"},{"issue":"7","key":"4444_CR27","first-page":"3523","volume":"44","author":"S Minaee","year":"2021","unstructured":"Minaee, S., Boykov, Y., Porikli, F., Plaza, A., Kehtarnavaz, N., Terzopoulos, D.: Image segmentation using deep learning: A survey. IEEE Trans. Pattern Anal. Mach. Intell. 44(7), 3523\u20133542 (2021)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"4444_CR28","doi-asserted-by":"publisher","DOI":"10.1016\/j.imavis.2022.104401","volume":"120","author":"W Gu","year":"2022","unstructured":"Gu, W., Bai, S., Kong, L.: A review on 2d instance segmentation based on deep neural networks. Image Vis. Comput. 120, 104401 (2022)","journal-title":"Image Vis. Comput."},{"key":"4444_CR29","unstructured":"Ren, T., Liu, S., Zeng, A., et al.: Grounded SAM: Assembling Open-World Models for Diverse Visual Tasks. arXiv:2401.14159 (2024)"},{"key":"4444_CR30","doi-asserted-by":"crossref","unstructured":"Tian, Z., Shen, C., Wang, X., et al.: Boxinst: High-performance instance segmentation with box annotations. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5443\u20135452 (2021)","DOI":"10.1109\/CVPR46437.2021.00540"},{"key":"4444_CR31","doi-asserted-by":"crossref","unstructured":"Wang, X., Zhao, K., Zhang, R., et al.: Contrastmask: Contrastive learning to segment every thing. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 11604\u201311613 (2022)","DOI":"10.1109\/CVPR52688.2022.01131"},{"issue":"2","key":"4444_CR32","doi-asserted-by":"publisher","first-page":"1108","DOI":"10.1109\/TPAMI.2020.3014297","volume":"44","author":"D Bolya","year":"2022","unstructured":"Bolya, D., Zhou, C., Xiao, F., Lee, Y.J.: Yolact++ better real-time instance segmentation. IEEE Trans. Pattern Anal. Mach. Intell. 44(2), 1108\u20131121 (2022). https:\/\/doi.org\/10.1109\/TPAMI.2020.3014297","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"20","key":"4444_CR33","doi-asserted-by":"publisher","first-page":"9332","DOI":"10.3390\/app14209332","volume":"14","author":"MF Senussi","year":"2024","unstructured":"Senussi, M.F., Kang, H.-S.: Occlusion removal in light-field images using cspdarknet53 and bidirectional feature pyramid network: A multi-scale fusion-based approach. Appl. Sci. 14(20), 9332 (2024)","journal-title":"Appl. Sci."},{"issue":"1","key":"4444_CR34","doi-asserted-by":"publisher","first-page":"36978","DOI":"10.1038\/s41598-025-20786-0","volume":"15","author":"MF Senussi","year":"2025","unstructured":"Senussi, M.F., Abdalla, M., Kasem, M.S., Mahmoud, M., Kang, H.-S.: Learning to remove occlusions in light field images using multiscale receptive fields and feature pyramid networks. Sci. Rep. 15(1), 36978 (2025)","journal-title":"Sci. Rep."},{"key":"4444_CR35","doi-asserted-by":"crossref","unstructured":"Kasem, M.S., Mahmoud, M., Senussi, M.F., Abdalla, M., Kang, H.-S.: Attention-guided hybrid learning for accurate defect classification in manufacturing environments. Scientific Reports (2025)","DOI":"10.1038\/s41598-025-31654-2"},{"key":"4444_CR36","doi-asserted-by":"crossref","unstructured":"Liu, S., Jia, J., Fidler, S., et al.: Sgn: Sequential grouping networks for instance segmentation. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 3496\u20133504 (2017)","DOI":"10.1109\/ICCV.2017.378"},{"key":"4444_CR37","doi-asserted-by":"crossref","unstructured":"Peng, S., Jiang, W., Pi, H., et al.: Deep snake for real-time instance segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 8533\u20138542 (2020)","DOI":"10.1109\/CVPR42600.2020.00856"},{"key":"4444_CR38","doi-asserted-by":"crossref","unstructured":"Zhang, G., Lu, X., Tan, J., et al.: Refinemask: Towards high-quality instance segmentation with fine-grained features. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 6861\u20136869 (2021)","DOI":"10.1109\/CVPR46437.2021.00679"},{"key":"4444_CR39","first-page":"2701","volume":"35","author":"T Vu","year":"2021","unstructured":"Vu, T., Kang, H., Yoo, C.D.: Scnet: Training inference sample consistency for instance segmentation. Proceed. AAAI Confer. Artific. Intell. 35, 2701\u20132709 (2021)","journal-title":"Proceed. AAAI Confer. Artific. Intell."},{"key":"4444_CR40","doi-asserted-by":"crossref","unstructured":"Ke, L., Danelljan, M., Li, X., et al.: Mask transfiner for high-quality instance segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4412\u20134421 (2022)","DOI":"10.1109\/CVPR52688.2022.00437"},{"key":"4444_CR41","doi-asserted-by":"publisher","first-page":"534","DOI":"10.1007\/978-3-319-46466-4_32","volume-title":"Computer Vision-ECCV 2016: 14th European Conference. Amsterdam, The Netherlands, October 11\u201314, 2016, Proceedings, Part VI 14","author":"J Dai","year":"2016","unstructured":"Dai, J., He, K., Li, Y., et al.: Instance-sensitive fully convolutional networks. In: Computer Vision-ECCV 2016: 14th European Conference. Amsterdam, The Netherlands, October 11\u201314, 2016, Proceedings, Part VI 14, pp. 534\u2013549. Springer, Cham (2016)"},{"key":"4444_CR42","doi-asserted-by":"crossref","unstructured":"Xie, E., Sun, P., Song, X., et al.: Polarmask: Single shot instance segmentation with polar representation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 12193\u201312202 (2020)","DOI":"10.1109\/CVPR42600.2020.01221"},{"key":"4444_CR43","doi-asserted-by":"crossref","unstructured":"Gao, N., Shan, Y., Wang, Y., et al.: Ssap: Single-shot instance segmentation with affinity pyramid. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 642\u2013651 (2019)","DOI":"10.1109\/ICCV.2019.00073"},{"key":"4444_CR44","first-page":"17721","volume":"33","author":"X Wang","year":"2020","unstructured":"Wang, X., Zhang, R., Kong, T., et al.: Solov2: Dynamic and fast instance segmentation. Adv. Neural. Inf. Process. Syst. 33, 17721\u201317732 (2020)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"4444_CR45","doi-asserted-by":"crossref","unstructured":"Lee, Y., Park, J.: Centermask: Real-time anchor-free instance segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 13906\u201313915 (2020)","DOI":"10.1109\/CVPR42600.2020.01392"},{"key":"4444_CR46","doi-asserted-by":"crossref","unstructured":"Tian, Z., Shen, C., Chen, H., et al.: Fcos: Fully convolutional one-stage object detection. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 9627\u20139636 (2019)","DOI":"10.1109\/ICCV.2019.00972"},{"key":"4444_CR47","doi-asserted-by":"crossref","unstructured":"Chen, X., Girshick, R., He, K., et al.: Tensormask: A foundation for dense object segmentation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 2061\u20132069 (2019)","DOI":"10.1109\/ICCV.2019.00215"},{"issue":"10","key":"4444_CR48","doi-asserted-by":"publisher","first-page":"8275","DOI":"10.1007\/s00521-021-05978-9","volume":"34","author":"P Hurtik","year":"2022","unstructured":"Hurtik, P., Molek, V., Hula, J., et al.: Poly-yolo: higher speed, more precise detection and instance segmentation for yolov3. Neural Comput. Appl. 34(10), 8275\u20138290 (2022)","journal-title":"Neural Comput. Appl."},{"key":"4444_CR49","unstructured":"Redmon, J., Farhadi, A.: YOLOv3: An Incremental Improvement. arXiv:1804.02767 (2018)"},{"key":"4444_CR50","doi-asserted-by":"crossref","unstructured":"Guo, R., Niu, D., Qu, L., et al.: Sotr: Segmenting objects with transformers. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 7157\u20137166 (2021)","DOI":"10.1109\/ICCV48922.2021.00707"},{"key":"4444_CR51","unstructured":"Hu, J., Cao, L., Lu, Y., et al.: ISTR: End-to-End Instance Segmentation with Transformers. arXiv preprint arXiv:2105.00637 (2021)"},{"key":"4444_CR52","first-page":"10326","volume":"34","author":"W Zhang","year":"2021","unstructured":"Zhang, W., Pang, J., Chen, K., et al.: K-net: Towards unified image segmentation. Adv. Neural. Inf. Process. Syst. 34, 10326\u201310338 (2021)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"4444_CR53","doi-asserted-by":"crossref","unstructured":"Zhang, T., Wei, S., Ji, S.: E2ec: An end-to-end contour-based method for high-quality high-speed instance segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4443\u20134452 (2022)","DOI":"10.1109\/CVPR52688.2022.00440"},{"key":"4444_CR54","doi-asserted-by":"crossref","unstructured":"Zang, Y., Huang, C., Loy, C.C.: Fasa: Feature augmentation and sampling adaptation for long-tailed instance segmentation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 3457\u20133466 (2021)","DOI":"10.1109\/ICCV48922.2021.00344"},{"key":"4444_CR55","doi-asserted-by":"publisher","first-page":"196654","DOI":"10.1109\/ACCESS.2025.3634156","volume":"13","author":"M Hayat","year":"2025","unstructured":"Hayat, M., Aramvith, S.: Superpixel-guided graph-attention boundary GAN for adaptive feature refinement in scribble-supervised medical image segmentation. IEEE Access 13, 196654\u2013196668 (2025). https:\/\/doi.org\/10.1109\/ACCESS.2025.3634156","journal-title":"IEEE Access"},{"key":"4444_CR56","doi-asserted-by":"publisher","first-page":"108876","DOI":"10.1109\/ACCESS.2024.3434714","volume":"12","author":"M Hayat","year":"2024","unstructured":"Hayat, M., Aramvith, S.: Transformer\u2019s role in brain mri: A scoping review. IEEE Access 12, 108876\u2013108896 (2024). https:\/\/doi.org\/10.1109\/ACCESS.2024.3434714","journal-title":"IEEE Access"},{"key":"4444_CR57","unstructured":"Senussi, M.F., Abdalla, M., Kasem, M.S., Mahmoud, M., Kang, H.-S.: Spectral normalized u-net for light field occlusion removal. In: International Conference on Future Information & Communication Engineering, vol. 16, pp. 294\u2013297 (2025). Proceedings metadata provided by the author; verify publisher\/ISBN if required by the journal"},{"key":"4444_CR58","doi-asserted-by":"publisher","unstructured":"Senussi, M.F., Abdalla, M., Kasem, M.S., Mahmoud, M., Kang, H.-S.: TriORU2-Net++: Attention-Guided Three-Stage U2-Net++ for Light Field Occlusion Removal. Research Square preprint. Posted Jan 19, 2026 (2026). https:\/\/doi.org\/10.21203\/rs.3.rs-7599592\/v1","DOI":"10.21203\/rs.3.rs-7599592\/v1"},{"key":"4444_CR59","doi-asserted-by":"publisher","unstructured":"Carion, N., Massa, F., Synnaeve, G., Usunier, N., Kirillov, A., Zagoruyko, S.: End-to-end object detection with transformers. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) Computer Vision \u2013 ECCV 2020. Lecture Notes in Computer Science, vol. 12346, pp. 213\u2013229. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58452-8_13","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"4444_CR60","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., et al.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"4444_CR61","doi-asserted-by":"crossref","unstructured":"Senussi, M.F., Abdalla, M., Kasem, M.S., Mahmoud, M., Yagoub, B., Kang, H.-S.: A comprehensive review on light field occlusion removal: Trends, challenges, and future directions. IEEE Access (2025)","DOI":"10.1109\/ACCESS.2025.3548133"},{"issue":"17","key":"4444_CR62","doi-asserted-by":"publisher","first-page":"2748","DOI":"10.3390\/math13172748","volume":"13","author":"MF Senussi","year":"2025","unstructured":"Senussi, M.F., Abdalla, M., Kasem, M.S., Mahmoud, M., Kang, H.-S.: U2-lfor: A two-stage u2 network for light-field occlusion removal. Mathematics 13(17), 2748 (2025)","journal-title":"Mathematics"},{"key":"4444_CR63","doi-asserted-by":"publisher","first-page":"98","DOI":"10.1007\/s11263-014-0733-5","volume":"111","author":"M Everingham","year":"2015","unstructured":"Everingham, M., Eslami, S.M.A., Van Gool, L., et al.: The pascal visual object classes challenge: A retrospective. Int. J. Comput. Vision 111, 98\u2013136 (2015)","journal-title":"Int. J. Comput. Vision"},{"issue":"23","key":"4444_CR64","doi-asserted-by":"publisher","DOI":"10.1088\/1361-6560\/abc363","volume":"65","author":"W Chi","year":"2020","unstructured":"Chi, W., Ma, L., Wu, J., Chen, M., Lu, W., Gu, X.: Deep learning-based medical image segmentation with limited labels. Phys. Med. Biol. 65(23), 235001 (2020)","journal-title":"Phys. Med. Biol."},{"issue":"1","key":"4444_CR65","doi-asserted-by":"publisher","first-page":"85","DOI":"10.3390\/math14010085","volume":"14","author":"EH Khujamatov","year":"2025","unstructured":"Khujamatov, E.H., Abdullaev, M., Umirzakova, S.: Analytical modeling of hybrid cnn-transformer dynamics for emotion classification. Mathematics 14(1), 85 (2025)","journal-title":"Mathematics"}],"container-title":["The Visual Computer"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-026-04444-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00371-026-04444-8","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-026-04444-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,4,29]],"date-time":"2026-04-29T13:17:26Z","timestamp":1777468646000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00371-026-04444-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,4]]},"references-count":65,"journal-issue":{"issue":"6","published-print":{"date-parts":[[2026,4]]}},"alternative-id":["4444"],"URL":"https:\/\/doi.org\/10.1007\/s00371-026-04444-8","relation":{},"ISSN":["0178-2789","1432-2315"],"issn-type":[{"value":"0178-2789","type":"print"},{"value":"1432-2315","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,4]]},"assertion":[{"value":"5 January 2026","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"3 March 2026","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"1 April 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"Not applicable.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent to participate"}},{"value":"Not applicable.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}},{"value":"Not applicable.","order":5,"name":"Ethics","group":{"name":"EthicsHeading","label":"Code availability"}},{"value":"The authors declare no conflict of interest.","order":6,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"235"}}