{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,5]],"date-time":"2026-05-05T00:18:58Z","timestamp":1777940338346,"version":"3.51.4"},"reference-count":64,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2026,5,2]],"date-time":"2026-05-02T00:00:00Z","timestamp":1777680000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,5,2]],"date-time":"2026-05-02T00:00:00Z","timestamp":1777680000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"name":"the Humanities and Social Sciences Research Program of Chongqing Municipal Education Commission","award":["No. 23SKGH263"],"award-info":[{"award-number":["No. 23SKGH263"]}]},{"name":"the Science and Technology Research Program of Chongqing Municipal Education Commission","award":["No. KJQN202201148"],"award-info":[{"award-number":["No. KJQN202201148"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Pattern Anal Applic"],"published-print":{"date-parts":[[2026,6]]},"DOI":"10.1007\/s10044-026-01680-5","type":"journal-article","created":{"date-parts":[[2026,5,2]],"date-time":"2026-05-02T05:45:46Z","timestamp":1777700746000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Interaction-guided attention and local region refinement for interactive image segmentation"],"prefix":"10.1007","volume":"29","author":[{"given":"Jianwu","family":"Long","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shaoyi","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yuanqin","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2026,5,2]]},"reference":[{"key":"1680_CR1","doi-asserted-by":"crossref","unstructured":"Liu Z, Lin Y, Cao Y, Hu H, Wei Y, Zhang Z, Lin S, Guo B (2021) Swin transformer: Hierarchical vision transformer using shifted windows. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp 10012\u201310022","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"1680_CR2","doi-asserted-by":"crossref","unstructured":"Sun K, Xiao B, Liu D, Wang J (2019) Deep high-resolution representation learning for human pose estimation. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 5693\u20135703","DOI":"10.1109\/CVPR.2019.00584"},{"key":"1680_CR3","doi-asserted-by":"crossref","unstructured":"Chen L-C, Zhu Y, Papandreou G, Schroff F, Adam H (2018) Encoder-decoder with atrous separable convolution for semantic image segmentation. In: Proceedings of the European conference on computer vision (ECCV), pp 801\u2013818","DOI":"10.1007\/978-3-030-01234-2_49"},{"key":"1680_CR4","doi-asserted-by":"crossref","unstructured":"Zhou Z, Rahman\u00a0Siddiquee MM, Tajbakhsh N, Liang J (2018) Unet++: A nested u-net architecture for medical image segmentation. In: Deep learning in medical image analysis and multimodal learning for clinical decision support: 4th international workshop, DLMIA 2018, and 8th International Workshop, ML-CDS 2018, Held in Conjunction with MICCAI 2018, Granada, Spain, September 20, 2018, Proceedings 4. Springer, pp 3\u201311","DOI":"10.1007\/978-3-030-00889-5_1"},{"key":"1680_CR5","first-page":"12077","volume":"34","author":"E Xie","year":"2021","unstructured":"Xie E, Wang W, Yu Z, Anandkumar A, Alvarez JM, Luo P (2021) Segformer: simple and efficient design for semantic segmentation with transformers. Adv Neural Inf Process Syst 34:12077\u201312090","journal-title":"Adv Neural Inf Process Syst"},{"key":"1680_CR6","doi-asserted-by":"publisher","first-page":"303","DOI":"10.1007\/s11263-009-0275-4","volume":"88","author":"M Everingham","year":"2010","unstructured":"Everingham M, Van Gool L, Williams CK, Winn J, Zisserman A (2010) The pascal visual object classes (voc) challenge. Int J Comput Vis 88:303\u2013338","journal-title":"Int J Comput Vis"},{"key":"1680_CR7","doi-asserted-by":"crossref","unstructured":"Lin T-Y, Maire M, Belongie S, Hays J, Perona P, Ramanan D, Doll\u00e1r P, Zitnick CL (2014) Microsoft coco: Common objects in context. In: Computer vision\u2013ECCV 2014: 13th European conference, Zurich, Switzerland, September 6-12, 2014, Proceedings, Part V 13. Springer, pp 740\u2013755","DOI":"10.1007\/978-3-319-10602-1_48"},{"issue":"1","key":"1680_CR8","doi-asserted-by":"publisher","first-page":"221","DOI":"10.1146\/annurev-bioeng-071516-044442","volume":"19","author":"D Shen","year":"2017","unstructured":"Shen D, Wu G, Suk H-I (2017) Deep learning in medical image analysis. Annu Rev Biomed Eng 19(1):221\u2013248","journal-title":"Annu Rev Biomed Eng"},{"key":"1680_CR9","doi-asserted-by":"publisher","first-page":"9402","DOI":"10.1109\/TIP.2021.3125491","volume":"30","author":"J Deng","year":"2021","unstructured":"Deng J, Xie X (2021) 3d interactive segmentation with semi-implicit representation and active learning. IEEE Trans Image Process 30:9402\u20139417","journal-title":"IEEE Trans Image Process"},{"issue":"2","key":"1680_CR10","doi-asserted-by":"publisher","first-page":"109","DOI":"10.1007\/s11263-006-7934-5","volume":"70","author":"Y Boykov","year":"2006","unstructured":"Boykov Y, Funka-Lea G (2006) Graph cuts and efficient nd image segmentation. Int J Comput Vis 70(2):109\u2013131","journal-title":"Int J Comput Vis"},{"key":"1680_CR11","doi-asserted-by":"crossref","unstructured":"Gulshan V, Rother C, Criminisi A, Blake A, Zisserman A (2010) Geodesic star convexity for interactive image segmentation. In: 2010 IEEE computer society conference on computer vision and pattern recognition. IEEE, pp 3129\u20133136","DOI":"10.1109\/CVPR.2010.5540073"},{"key":"1680_CR12","doi-asserted-by":"crossref","unstructured":"Zhang S, Liew JH, Wei Y, Wei S, Zhao Y (2020) Interactive object segmentation with inside-outside guidance. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 12234\u201312244","DOI":"10.1109\/CVPR42600.2020.01225"},{"key":"1680_CR13","doi-asserted-by":"crossref","unstructured":"Li K, Vosselman G, Yang MY (2023) Interactive image segmentation with cross-modality vision transformers. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp 762\u2013772","DOI":"10.1109\/ICCVW60793.2023.00084"},{"key":"1680_CR14","doi-asserted-by":"crossref","unstructured":"Lee C, Lee S-H, Kim C-S (2024) Mfp: Making full use of probability maps for interactive image segmentation. In: 2024 IEEE\/CVF conference on computer vision and pattern recognition (CVPR). IEEE, pp 4051\u20134059","DOI":"10.1109\/CVPR52733.2024.00388"},{"key":"1680_CR15","doi-asserted-by":"crossref","unstructured":"Lin J, Chen J, Yang K, Roitberg A, Li S, Li Z, Li S (2024) Adaptiveclick: Click-aware transformer with adaptive focal loss for interactive image segmentation. IEEE Trans Neural Netw Learn Syst","DOI":"10.1109\/TNNLS.2024.3378295"},{"key":"1680_CR16","doi-asserted-by":"crossref","unstructured":"Chen X, Zhao Z, Yu F, Zhang Y, Duan M (2021) Conditional diffusion for interactive segmentation. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp 7345\u20137354","DOI":"10.1109\/ICCV48922.2021.00725"},{"key":"1680_CR17","doi-asserted-by":"crossref","unstructured":"Chen X, Zhao Z, Zhang Y, Duan M, Qi D, Zhao H (2022) Focalclick: Towards practical interactive image segmentation. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 1300\u20131309","DOI":"10.1109\/CVPR52688.2022.00136"},{"key":"1680_CR18","doi-asserted-by":"crossref","unstructured":"Xu N, Price B, Cohen S, Yang J, Huang TS (2016) Deep interactive object selection. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 373\u2013381","DOI":"10.1109\/CVPR.2016.47"},{"key":"1680_CR19","doi-asserted-by":"crossref","unstructured":"Wei Q, Zhang H, Yong J-H (2023) Focused and collaborative feedback integration for interactive image segmentation. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 18643\u201318652","DOI":"10.1109\/CVPR52729.2023.01788"},{"key":"1680_CR20","doi-asserted-by":"crossref","unstructured":"Lin Z, Zhang Z, Chen L-Z, Cheng M-M, Lu S-P (2020) Interactive image segmentation with first click attention. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 13339\u201313348","DOI":"10.1109\/CVPR42600.2020.01335"},{"key":"1680_CR21","doi-asserted-by":"crossref","unstructured":"Sofiiuk K, Petrov I, Barinova O, Konushin A (2020) f-brs: Rethinking backpropagating refinement for interactive segmentation. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 8623\u20138632","DOI":"10.1109\/CVPR42600.2020.00865"},{"key":"1680_CR22","doi-asserted-by":"crossref","unstructured":"Sofiiuk K, Petrov IA, Konushin A (2022) Reviving iterative training with mask guidance for interactive segmentation. In: 2022 IEEE international conference on image processing (ICIP). IEEE, pp 3141\u20133145","DOI":"10.1109\/ICIP46576.2022.9897365"},{"key":"1680_CR23","unstructured":"Mahadevan S, Voigtlaender P, Leibe B (2018) Iteratively trained interactive segmentation. arXiv preprint arXiv:1805.04398"},{"key":"1680_CR24","doi-asserted-by":"publisher","first-page":"31","DOI":"10.1016\/j.neunet.2018.10.009","volume":"109","author":"Y Hu","year":"2019","unstructured":"Hu Y, Soltoggio A, Lock R, Carter S (2019) A fully convolutional two-stream fusion network for interactive image segmentation. Neural Netw 109:31\u201342","journal-title":"Neural Netw"},{"key":"1680_CR25","doi-asserted-by":"crossref","unstructured":"Long J, Liu Y, Wang S, Chen S, Luo Q (2025) Fusing multi-stage clicks with deep feedback aggregation for interactive image segmentation. Comput Gr:104445","DOI":"10.1016\/j.cag.2025.104445"},{"key":"1680_CR26","doi-asserted-by":"crossref","unstructured":"Yuan Y, Chen X, Wang J (2020) Object-contextual representations for semantic segmentation. In: Computer vision\u2013ECCV 2020: 16th European conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part VI 16. Springer, pp 173\u2013190","DOI":"10.1007\/978-3-030-58539-6_11"},{"key":"1680_CR27","doi-asserted-by":"crossref","unstructured":"Xu N, Price B, Cohen S, Yang J, Huang T (2017) Deep grabcut for object selection. arXiv preprint arXiv:1707.00243","DOI":"10.5244\/C.31.182"},{"key":"1680_CR28","doi-asserted-by":"crossref","unstructured":"Lempitsky V, Kohli P, Rother C, Sharp T (2009) Image segmentation with a bounding box prior. In: 2009 IEEE 12th international conference on computer vision. IEEE, pp 277\u2013284","DOI":"10.1109\/ICCV.2009.5459262"},{"issue":"3","key":"1680_CR29","doi-asserted-by":"publisher","first-page":"309","DOI":"10.1145\/1015706.1015720","volume":"23","author":"C Rother","year":"2004","unstructured":"Rother C, Kolmogorov V, Blake A (2004) \u201cgrabcut\u2019\u2019 interactive foreground extraction using iterated graph cuts. ACM Trans Gr (TOG) 23(3):309\u2013314","journal-title":"ACM Trans Gr (TOG)"},{"key":"1680_CR30","doi-asserted-by":"crossref","unstructured":"Wu J, Zhao Y, Zhu J-Y, Luo S, Tu Z (2014) Milcut: a sweeping line multiple instance learning paradigm for interactive image segmentation. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 256\u2013263","DOI":"10.1109\/CVPR.2014.40"},{"key":"1680_CR31","doi-asserted-by":"crossref","unstructured":"Boykov YY, Jolly M-P (2001) Interactive graph cuts for optimal boundary & region segmentation of objects in nd images. In: Proceedings eighth IEEE international conference on computer vision. ICCV 2001, vol 1. IEEE, pp 105\u2013112","DOI":"10.1109\/ICCV.2001.937505"},{"issue":"11","key":"1680_CR32","doi-asserted-by":"publisher","first-page":"1768","DOI":"10.1109\/TPAMI.2006.233","volume":"28","author":"L Grady","year":"2006","unstructured":"Grady L (2006) Random walks for image segmentation. IEEE Trans Pattern Anal Mach Intell 28(11):1768\u20131783","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"issue":"2","key":"1680_CR33","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s10044-025-01432-x","volume":"28","author":"J Long","year":"2025","unstructured":"Long J, Liu Y, Zhang K, Chen S, Luo Q (2025) Interactive image segmentation combining global seeding and sparse local reconstruction. Pattern Anal Appl 28(2):1\u201323","journal-title":"Pattern Anal Appl"},{"key":"1680_CR34","doi-asserted-by":"crossref","unstructured":"Maninis K-K, Caelles S, Pont-Tuset J, Van\u00a0Gool L (2018) Deep extreme cut: from extreme points to object segmentation. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 616\u2013625","DOI":"10.1109\/CVPR.2018.00071"},{"key":"1680_CR35","doi-asserted-by":"crossref","unstructured":"Jang W-D, Kim C-S (2019) Interactive image segmentation via backpropagating refinement scheme. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 5297\u20135306","DOI":"10.1109\/CVPR.2019.00544"},{"key":"1680_CR36","unstructured":"Vaswani A, Shazeer N, Parmar N, Uszkoreit J, Jones L, Gomez AN, Kaiser \u0141, Polosukhin I (2017) Attention is all you need. Adv Neural Inf Process Syst 30"},{"key":"1680_CR37","unstructured":"Dosovitskiy A, Beyer L, Kolesnikov, A, Weissenborn D, Zhai X, Unterthiner T, Dehghani M, Minderer M, Heigold G, Gelly S et al (2020) An image is worth 16x16 words: transformers for image recognition at scale. arXiv preprint arXiv:2010.11929"},{"key":"1680_CR38","doi-asserted-by":"crossref","unstructured":"Liu Q, Xu Z, Bertasius G, Niethammer M (2023) Simpleclick: interactive image segmentation with simple vision transformers. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp 22290\u201322300","DOI":"10.1109\/ICCV51070.2023.02037"},{"key":"1680_CR39","doi-asserted-by":"crossref","unstructured":"He K, Chen X, Xie S, Li Y, Doll\u00e1r P, Girshick R (2022) Masked autoencoders are scalable vision learners. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 16000\u201316009","DOI":"10.1109\/CVPR52688.2022.01553"},{"key":"1680_CR40","doi-asserted-by":"crossref","unstructured":"Cui Y, Yan L, Cao Z, Liu D (2021) Tf-blender: temporal feature blender for video object detection. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp 8138\u20138147","DOI":"10.1109\/ICCV48922.2021.00803"},{"issue":"10","key":"1680_CR41","doi-asserted-by":"publisher","first-page":"6642","DOI":"10.1109\/TCSVT.2022.3177320","volume":"32","author":"L Yan","year":"2022","unstructured":"Yan L, Ma S, Wang Q, Chen Y, Zhang X, Savakis A, Liu D (2022) Video captioning using global-local representation. IEEE Trans Circuits Syst Video Technol 32(10):6642\u20136656","journal-title":"IEEE Trans Circuits Syst Video Technol"},{"key":"1680_CR42","doi-asserted-by":"crossref","unstructured":"Chen X, Zhao Z, Yu F, Zhang Y, Duan M (2021) Conditional diffusion for interactive segmentation. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp 7345\u20137354","DOI":"10.1109\/ICCV48922.2021.00725"},{"key":"1680_CR43","doi-asserted-by":"crossref","unstructured":"Hao Y, Liu Y, Wu Z, Han L, Chen Y, Chen G, Chu L, Tang S, Yu Z, Chen Z et al (2021) Edgeflow: achieving practical interactive segmentation with edge-guided flow. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp 1551\u20131560","DOI":"10.1109\/ICCVW54120.2021.00180"},{"key":"1680_CR44","doi-asserted-by":"crossref","unstructured":"Liew J, Wei Y, Xiong W, Ong S-H, Feng J (2017) Regional interactive image segmentation networks. In: 2017 IEEE international conference on computer vision (ICCV). IEEE, pp 2746\u20132754","DOI":"10.1109\/ICCV.2017.297"},{"issue":"1","key":"1680_CR45","doi-asserted-by":"publisher","first-page":"393","DOI":"10.1109\/TCSVT.2022.3202574","volume":"33","author":"L Yan","year":"2022","unstructured":"Yan L, Wang Q, Ma S, Wang J, Yu C (2022) Solve the puzzle of instance segmentation in videos: a weakly supervised framework with spatio-temporal collaboration. IEEE Trans Circuits Syst Video Technol 33(1):393\u2013406","journal-title":"IEEE Trans Circuits Syst Video Technol"},{"key":"1680_CR46","doi-asserted-by":"crossref","unstructured":"Yan L, Wang Q, Zhao J, Guan Q, Tang Z, Zhang J, Liu D (2024) Radiance field learners as uav first-person viewers. In: European conference on computer vision. Springer, pp 88\u2013107","DOI":"10.1007\/978-3-031-73030-6_6"},{"key":"1680_CR47","unstructured":"Vaswani A, Shazeer N, Parmar N, Uszkoreit J, Jones L, Gomez AN, Kaiser \u0141, Polosukhin I (2017) Attention is all you need. Adv Neural Inf Process Syst 30"},{"key":"1680_CR48","doi-asserted-by":"crossref","unstructured":"Antol S, Agrawal A, Lu J, Mitchell M, Batra D, Zitnick CL, Parikh D (2015) Vqa: Visual question answering. In: Proceedings of the IEEE international conference on computer vision, pp 2425\u20132433","DOI":"10.1109\/ICCV.2015.279"},{"key":"1680_CR49","first-page":"689","volume":"11","author":"J Ngiam","year":"2011","unstructured":"Ngiam J, Khosla A, Kim M, Nam J, Lee H, Ng AY et al (2011) Multimodal deep learning. ICML 11:689\u2013696","journal-title":"ICML"},{"key":"1680_CR50","doi-asserted-by":"crossref","unstructured":"Qian R, Garg D, Wang Y, You Y, Belongie S, Hariharan B, Campbell M, Weinberger KQ, Chao W-L (2020) End-to-end pseudo-lidar for image-based 3d object detection. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 5881\u20135890","DOI":"10.1109\/CVPR42600.2020.00592"},{"key":"1680_CR51","doi-asserted-by":"crossref","unstructured":"Lin Z, Duan Z-P, Zhang Z, Guo C-L, Cheng M-M (2022) Focuscut: Diving into a focus view in interactive segmentation. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 2637\u20132646","DOI":"10.1109\/CVPR52688.2022.00266"},{"key":"1680_CR52","doi-asserted-by":"crossref","unstructured":"Hariharan B, Arbel\u00e1ez P, Bourdev L, Maji S, Malik J (2011) Semantic contours from inverse detectors. In: 2011 international conference on computer vision. IEEE, pp 991\u2013998","DOI":"10.1109\/ICCV.2011.6126343"},{"key":"1680_CR53","doi-asserted-by":"crossref","unstructured":"Gupta A, Dollar P, Girshick R (2019) Lvis: a dataset for large vocabulary instance segmentation. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 5356\u20135364","DOI":"10.1109\/CVPR.2019.00550"},{"key":"1680_CR54","doi-asserted-by":"crossref","unstructured":"Martin D, Fowlkes C, Tal D, Malik J (2001) A database of human segmented natural images and its application to evaluating segmentation algorithms and measuring ecological statistics. In: Proceedings eighth IEEE international conference on computer vision. ICCV 2001, vol 2. IEEE, pp 416\u2013423","DOI":"10.1109\/ICCV.2001.937655"},{"key":"1680_CR55","doi-asserted-by":"crossref","unstructured":"Perazzi F, Pont-Tuset J, McWilliams B, Van\u00a0Gool L, Gross M, Sorkine-Hornung A (2016) A benchmark dataset and evaluation methodology for video object segmentation. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 724\u2013732","DOI":"10.1109\/CVPR.2016.85"},{"key":"1680_CR56","doi-asserted-by":"crossref","unstructured":"Song S, Yu S, Zhou H, Huang X, Yu L, Xiao J (2025) Diffclick: click-differentiated enhancement network for interactive segmentation. Pattern Recogn 112217","DOI":"10.1016\/j.patcog.2025.112217"},{"key":"1680_CR57","doi-asserted-by":"crossref","unstructured":"Liu Q, Xu Z, Bertasius G, Niethammer M (2023) Simpleclick: interactive image segmentation with simple vision transformers. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp 22290\u201322300","DOI":"10.1109\/ICCV51070.2023.02037"},{"key":"1680_CR58","doi-asserted-by":"crossref","unstructured":"Havrylov V, Huang H, Zhang D, Geiger A (2025) Benchmarking feature upsampling methods for vision foundation models using interactive segmentation. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp 210\u2013219","DOI":"10.1109\/ICCVW69036.2025.00028"},{"key":"1680_CR59","doi-asserted-by":"crossref","unstructured":"Zhou M, Wang H, Zhao Q, Li Y, Huang Y, Meng D, Zheng Y (2023) Interactive segmentation as gaussion process classification. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 19488\u201319497","DOI":"10.1109\/CVPR52729.2023.01867"},{"key":"1680_CR60","doi-asserted-by":"publisher","first-page":"177","DOI":"10.1109\/TIP.2023.3338003","volume":"33","author":"J Lin","year":"2023","unstructured":"Lin J, Xiao Z, Wei X, Duan P, He X, Dian R, Li Z, Li S (2023) Click-pixel cognition fusion network with balanced cut for interactive image segmentation. IEEE Trans Image Process 33:177\u2013190","journal-title":"IEEE Trans Image Process"},{"key":"1680_CR61","doi-asserted-by":"crossref","unstructured":"Huang Y, Yang H, Sun K, Zhang S, Cao L, Jiang G, Ji R (2023) Interformer: real-time interactive image segmentation. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp 22301\u201322311","DOI":"10.1109\/ICCV51070.2023.02038"},{"key":"1680_CR62","doi-asserted-by":"crossref","unstructured":"Rana AK, Mahadevan S, Hermans A, Leibe B (2023) Dynamite: Dynamic query bootstrapping for multi-object interactive segmentation transformer. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp 1043\u20131052","DOI":"10.1109\/ICCV51070.2023.00102"},{"key":"1680_CR63","doi-asserted-by":"crossref","unstructured":"Du F, Yuan J, Wang Z, Wang F (2023) Efficient mask correction for click-based interactive image segmentation. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 22773\u201322782","DOI":"10.1109\/CVPR52729.2023.02181"},{"key":"1680_CR64","doi-asserted-by":"crossref","unstructured":"Liu Q, Xu Z, Jiao Y, Niethammer M (2022) isegformer: interactive segmentation via transformers with application to 3d knee mr images. In: International conference on medical image computing and computer-assisted intervention. Springer, pp 464\u2013474","DOI":"10.1007\/978-3-031-16443-9_45"}],"container-title":["Pattern Analysis and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10044-026-01680-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10044-026-01680-5","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10044-026-01680-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,5,2]],"date-time":"2026-05-02T05:45:57Z","timestamp":1777700757000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10044-026-01680-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,5,2]]},"references-count":64,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2026,6]]}},"alternative-id":["1680"],"URL":"https:\/\/doi.org\/10.1007\/s10044-026-01680-5","relation":{},"ISSN":["1433-7541","1433-755X"],"issn-type":[{"value":"1433-7541","type":"print"},{"value":"1433-755X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,5,2]]},"assertion":[{"value":"22 January 2026","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"18 April 2026","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"2 May 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"96"}}