{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,22]],"date-time":"2026-06-22T11:53:24Z","timestamp":1782129204698,"version":"3.54.5"},"reference-count":55,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2026,11,1]],"date-time":"2026-11-01T00:00:00Z","timestamp":1793491200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2026,11,1]],"date-time":"2026-11-01T00:00:00Z","timestamp":1793491200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2026,11,1]],"date-time":"2026-11-01T00:00:00Z","timestamp":1793491200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-017"},{"start":{"date-parts":[[2026,11,1]],"date-time":"2026-11-01T00:00:00Z","timestamp":1793491200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"},{"start":{"date-parts":[[2026,11,1]],"date-time":"2026-11-01T00:00:00Z","timestamp":1793491200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-012"},{"start":{"date-parts":[[2026,11,1]],"date-time":"2026-11-01T00:00:00Z","timestamp":1793491200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,11,1]],"date-time":"2026-11-01T00:00:00Z","timestamp":1793491200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-004"}],"funder":[{"DOI":"10.13039\/501100004775","name":"Gansu Provincial Natural Science Foundation","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100004775","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Information Fusion"],"published-print":{"date-parts":[[2026,11]]},"DOI":"10.1016\/j.inffus.2026.104470","type":"journal-article","created":{"date-parts":[[2026,5,12]],"date-time":"2026-05-12T10:04:12Z","timestamp":1778580252000},"page":"104470","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":0,"special_numbering":"C","title":["Deepest-only integration of vision and textual semantics in expectation-maximization space for generalizable medical image segmentation"],"prefix":"10.1016","volume":"135","author":[{"given":"Wenjun","family":"Yu","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yinchen","family":"Zhou","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jia-Xuan","family":"Jiang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Shubin","family":"Zeng","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yuee","family":"Li","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8648-9999","authenticated-orcid":false,"given":"Zhong","family":"Wang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"78","reference":[{"key":"10.1016\/j.inffus.2026.104470_sbref0001","doi-asserted-by":"crossref","DOI":"10.1016\/j.eswa.2023.123052","article-title":"Deep semi-supervised learning for medical image segmentation: a review","volume":"245","author":"Han","year":"2024","journal-title":"Expert Syst. Appl."},{"key":"10.1016\/j.inffus.2026.104470_bib0002","unstructured":"Z. Li, Y. Li, Q. Li, P. Wang, D. Guo, L. Lu, D. Jin, Y. Zhang, Q. Hong, LViT: language meets vision transformer in medical image segmentation, 2023. https:\/\/arxiv.org\/abs\/2206.14718. 2206.14718."},{"key":"10.1016\/j.inffus.2026.104470_sbref0003","doi-asserted-by":"crossref","DOI":"10.1016\/j.bspc.2023.105770","article-title":"An efficient framework for optic disk segmentation and classification of Glaucoma on fundus images","volume":"89","author":"Sanghavi","year":"2024","journal-title":"Biomed. Signal Process. Control"},{"key":"10.1016\/j.inffus.2026.104470_sbref0004","doi-asserted-by":"crossref","first-page":"468","DOI":"10.1016\/j.neunet.2023.10.046","article-title":"Combining external-latent attention for medical image segmentation","volume":"170","author":"Song","year":"2024","journal-title":"Neural Netw."},{"key":"10.1016\/j.inffus.2026.104470_bib0005","series-title":"Physical Principles of Medical Imaging","author":"Sprawls","year":"1995"},{"issue":"1","key":"10.1016\/j.inffus.2026.104470_bib0006","doi-asserted-by":"crossref","first-page":"151","DOI":"10.1007\/s10994-009-5152-4","article-title":"A theory of learning from different domains","volume":"79","author":"Ben-David","year":"2010","journal-title":"Mach. Learn."},{"key":"10.1016\/j.inffus.2026.104470_bib0007","unstructured":"K. Kamnitsas, C. Baumgartner, C. Ledig, V.F.J. Newcombe, J.P. Simpson, A.D. Kane, D.K. Menon, A. Nori, A. Criminisi, D. Rueckert, B. Glocker, Unsupervised domain adaptation in brain lesion segmentation with adversarial networks, 2016. https:\/\/arxiv.org\/abs\/1612.08894. 1612.08894."},{"key":"10.1016\/j.inffus.2026.104470_bib0008","doi-asserted-by":"crossref","unstructured":"Q. Dou, C. Ouyang, C. Chen, H. Chen, P.-A. Heng, Unsupervised cross-modality domain adaptation of convnets for biomedical image segmentations with adversarial loss, 2018. https:\/\/arxiv.org\/abs\/1804.10916. 1804.10916.","DOI":"10.24963\/ijcai.2018\/96"},{"issue":"5","key":"10.1016\/j.inffus.2026.104470_bib0009","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/3400066","article-title":"A survey of unsupervised deep domain adaptation","volume":"11","author":"Wilson","year":"2020","journal-title":"ACM Trans. Intell. Syst. Technol."},{"key":"10.1016\/j.inffus.2026.104470_bib0010","series-title":"Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition","first-page":"9624","article-title":"Open domain generalization with domain-augmented meta-learning","author":"Shu","year":"2021"},{"key":"10.1016\/j.inffus.2026.104470_bib0011","doi-asserted-by":"crossref","unstructured":"S. Liu, S. Yin, L. Qu, M. Wang, Reducing domain gap in frequency and spatial domain for cross-modality domain adaptation on medical image segmentation, Proc. AAAI Conf. Artif. Intell. 37 (2023) 1719\u20131727.","DOI":"10.1609\/aaai.v37i2.25260"},{"key":"10.1016\/j.inffus.2026.104470_bib0012","doi-asserted-by":"crossref","unstructured":"Y. Xu, S. Xie, M. Reynolds, M. Ragoza, M. Gong, K. Batmanghelich, Adversarial consistency for single domain generalization in medical image segmentation, in: International Conference on Medical Image Computing and Computer-Assisted Intervention, Springer, 2022, pp. 671\u2013681.","DOI":"10.1007\/978-3-031-16449-1_64"},{"key":"10.1016\/j.inffus.2026.104470_bib0013","doi-asserted-by":"crossref","first-page":"4131","DOI":"10.1109\/TMI.2025.3564474","article-title":"Domain-generalized discrete diffusion model for cross-domain medical image segmentation","volume":"44","author":"Yang","year":"2025","journal-title":"IEEE Trans. Med. Imaging"},{"key":"10.1016\/j.inffus.2026.104470_bib0014","doi-asserted-by":"crossref","unstructured":"Z. Su, K. Yao, X. Yang, Q. Wang, J. Sun, K. Huang, Rethinking data augmentation for single-source domain generalization in medical image segmentation, Proc. AAAI Conf. Artif. Intell. 37 (2023) 2366\u20132374.","DOI":"10.1609\/aaai.v37i2.25332"},{"key":"10.1016\/j.inffus.2026.104470_bib0015","doi-asserted-by":"crossref","unstructured":"S. Hu, Z. Liao, Y. Xia, Devil is in channels: Contrastive single domain generalization for medical image segmentation, in: International Conference on Medical Image Computing and Computer-Assisted Intervention, Springer, 2023, pp. 14\u201323.","DOI":"10.1007\/978-3-031-43901-8_2"},{"issue":"1","key":"10.1016\/j.inffus.2026.104470_bib0016","doi-asserted-by":"crossref","first-page":"96","DOI":"10.1109\/TMI.2023.3291719","article-title":"LViT: language meets vision transformer in medical image segmentation","volume":"43","author":"Li","year":"2023","journal-title":"IEEE Trans. Med. Imaging"},{"key":"10.1016\/j.inffus.2026.104470_bib0017","unstructured":"A. Radford, J. Kim, C. Hallacy, A. Ramesh, G. Goh, S. Agarwal, G. Sastry, A. Askell, P. Mishkin, J. Clark, G. Krueger, I. Sutskever, Learning transferable visual models from natural language supervision, in: International Conference on Machine Learning, PMLR, 2021, pp. 8748\u20138763."},{"key":"10.1016\/j.inffus.2026.104470_bib0018","series-title":"Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","first-page":"28619","article-title":"Stronger fewer & superior: harnessing vision foundation models for domain generalized semantic segmentation","author":"Wei","year":"2024"},{"key":"10.1016\/j.inffus.2026.104470_bib0019","series-title":"European Conference on Computer Vision","first-page":"37","article-title":"Textual query-driven mask transformer for domain generalized segmentation","author":"Pak","year":"2024"},{"key":"10.1016\/j.inffus.2026.104470_sbref0020","first-page":"1","article-title":"Domain generalization: a survey","author":"Zhou","year":"2022","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"10.1016\/j.inffus.2026.104470_bib0021","doi-asserted-by":"crossref","DOI":"10.1016\/j.engappai.2026.113979","article-title":"Prototype-guided domain-invariant enhancement and domain-specific normalization for domain generalization semantic segmentation","volume":"167","author":"Liao","year":"2026","journal-title":"Eng. Appl. Artif. Intell."},{"key":"10.1016\/j.inffus.2026.104470_bib0022","doi-asserted-by":"crossref","first-page":"1095","DOI":"10.1109\/TMI.2022.3224067","article-title":"Causality-inspired single-source domain generalization for medical image segmentation","volume":"42","author":"Ouyang","year":"2022","journal-title":"IEEE Trans. Med. Imaging"},{"key":"10.1016\/j.inffus.2026.104470_bib0023","doi-asserted-by":"crossref","DOI":"10.1016\/j.patcog.2025.111550","article-title":"Concept-guided domain generalization for semantic segmentation","volume":"164","author":"Liao","year":"2025","journal-title":"Pattern Recognit."},{"key":"10.1016\/j.inffus.2026.104470_sbref0024","doi-asserted-by":"crossref","DOI":"10.1016\/j.inffus.2025.103029","article-title":"Enhancing cross-domain generalization by fusing language-guided feature remapping","volume":"119","author":"Qiao","year":"2025","journal-title":"Inf. Fusion"},{"issue":"7981","key":"10.1016\/j.inffus.2026.104470_bib0025","doi-asserted-by":"crossref","first-page":"156","DOI":"10.1038\/s41586-023-06555-x","article-title":"A foundation model for generalizable disease detection from retinal images","volume":"622","author":"Zhou","year":"2023","journal-title":"Nature"},{"key":"10.1016\/j.inffus.2026.104470_bib0026","series-title":"Proceedings of the Computer Vision and Pattern Recognition Conference","first-page":"15043","article-title":"FisherTune: fisher-guided robust tuning of vision foundation models for domain generalized segmentation","author":"Zhao","year":"2025"},{"key":"10.1016\/j.inffus.2026.104470_bib0027","doi-asserted-by":"crossref","first-page":"94047","DOI":"10.52202\/079017-2983","article-title":"Learning frequency-adapted vision foundation model for domain generalized semantic segmentation","volume":"37","author":"Bi","year":"2024","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"10.1016\/j.inffus.2026.104470_bib0028","doi-asserted-by":"crossref","DOI":"10.1016\/j.media.2025.103547","article-title":"Medical SAM adapter: adapting segment anything model for medical image segmentation","volume":"102","author":"Wu","year":"2025","journal-title":"Med. Image Anal."},{"key":"10.1016\/j.inffus.2026.104470_bib0029","series-title":"Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","article-title":"DenseCLIP: language-guided dense prediction with context-aware prompting","author":"Rao","year":"2022"},{"key":"10.1016\/j.inffus.2026.104470_bib0030","article-title":"Domain-generalized token linking in vision foundation models for semantic segmentation","volume":"313","author":"Liao","year":"2025","journal-title":"Knowl. Based Syst."},{"key":"10.1016\/j.inffus.2026.104470_bib0031","article-title":"Cascaded interaction and selective calibration for unsupervised domain adaptive semantic segmentation in urban scenes","volume":"285","author":"Liao","year":"2026","journal-title":"Expert Syst. Appl."},{"key":"10.1016\/j.inffus.2026.104470_bib0032","first-page":"5998","article-title":"Attention is all you need","volume":"30","author":"Vaswani","year":"2017","journal-title":"Adv. Neural Inf. Process. Syst."},{"issue":"1","key":"10.1016\/j.inffus.2026.104470_sbref0033","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1111\/j.2517-6161.1977.tb01600.x","article-title":"Maximum likelihood from incomplete data via the EM algorithm","volume":"39","author":"Dempster","year":"1977","journal-title":"J. R. Stat. Soc. Ser. B (Methodological)"},{"key":"10.1016\/j.inffus.2026.104470_bib0034","doi-asserted-by":"crossref","unstructured":"X. Zhang, R.T. Tan, Mamba as a bridge: Where vision foundation models meet vision language models for domain-generalized semantic segmentation, in: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 2025, pp. 14527\u201314537.","DOI":"10.1109\/CVPR52734.2025.01354"},{"key":"10.1016\/j.inffus.2026.104470_bib0035","first-page":"6586","article-title":"Hierarchical self-attention network for industrial data series modeling with different sampling rates between the input and output sequences","volume":"35","author":"Yuan","year":"2024","journal-title":"IEEE Trans. Neural Netw. Learn. Syst."},{"key":"10.1016\/j.inffus.2026.104470_sbref0036","series-title":"2016 Fourth International Conference on 3D Vision (3DV)","article-title":"V-net: fully convolutional neural networks for volumetric medical image segmentation","author":"Milletari","year":"2016"},{"key":"10.1016\/j.inffus.2026.104470_sbref0037","series-title":"International Conference on Learning Representations (ICLR)","article-title":"Decoupled weight decay regularization","author":"Loshchilov","year":"2019"},{"issue":"11","key":"10.1016\/j.inffus.2026.104470_bib0038","doi-asserted-by":"crossref","first-page":"2514","DOI":"10.1109\/TMI.2018.2837502","article-title":"Deep learning techniques for automatic MRI cardiac multi-structures segmentation and diagnosis: is the problem solved?","volume":"37","author":"Bernard","year":"2018","journal-title":"IEEE Trans. Med. Imaging"},{"key":"10.1016\/j.inffus.2026.104470_bib0039","doi-asserted-by":"crossref","unstructured":"Y. Tian, C. Wen, M. Shi, M.M. Afzal, H. Huang, M.O. Khan, Y. Luo, Y. Fang, M. Wang, FairDomain: achieving fairness in cross-domain medical image segmentation and classification, (2024). arXiv preprint arXiv: 2407.08813.","DOI":"10.1007\/978-3-031-73116-7_15"},{"key":"10.1016\/j.inffus.2026.104470_bib0040","series-title":"Medical Imaging 2018: Imaging Informatics for Healthcare, Research, and Applications","first-page":"55","article-title":"Retinal fundus images for glaucoma analysis: the RIGA dataset","volume":"10579","author":"Almazroa","year":"2018"},{"key":"10.1016\/j.inffus.2026.104470_bib0041","series-title":"2011 24th International Symposium on Computer-based Medical Systems (CBMS)","first-page":"1","article-title":"RIM-ONE: an open retinal image database for optic nerve evaluation","author":"Fumero","year":"2011"},{"key":"10.1016\/j.inffus.2026.104470_bib0042","series-title":"2014 IEEE 11th International Symposium on Biomedical Imaging (ISBI)","first-page":"53","article-title":"Drishti-GS: retinal image dataset for optic nerve head (onh) segmentation","author":"Sivaswamy","year":"2014"},{"key":"10.1016\/j.inffus.2026.104470_bib0043","doi-asserted-by":"crossref","DOI":"10.1016\/j.media.2019.101570","article-title":"Refuge challenge: a unified framework for evaluating automated methods for glaucoma assessment from fundus photographs","volume":"59","author":"Orlando","year":"2020","journal-title":"Med. Image Anal."},{"key":"10.1016\/j.inffus.2026.104470_bib0044","unstructured":"M. Oquab, T. Darcet, T. Moutakanni, H. Vo, M. Szafraniec, V. Khalidov, P. Fernandez, D. Haziza, F. Massa, A. El-Nouby, M. Assran, N. Ballas, W. Galuba, R. Howes, P.-Y. Huang, S.-W. Li, I. Misra, M. Rabbat, V. Sharma, G. Synnaeve, H. Xu, H. Jegou, J. Mairal, P. Labatut, A. Joulin, P. Bojanowski, DINOv2: Learning robust visual features without supervision, arXiv preprint arXiv: 2304.07193 (2023)."},{"key":"10.1016\/j.inffus.2026.104470_bib0045","series-title":"Medical Image Computing and Computer-Assisted Intervention \u2013 MICCAI 2015","first-page":"234","article-title":"U-net: convolutional networks for biomedical image segmentation","author":"Ronneberger","year":"2015"},{"key":"10.1016\/j.inffus.2026.104470_bib0046","unstructured":"T. Devries, G. Taylor, Improved regularization of convolutional neural networks with cutout, arXiv preprint arXiv: 1708.04552 (2017)."},{"key":"10.1016\/j.inffus.2026.104470_bib0047","unstructured":"Z. Xu, D. Liu, J. Yang, C. Raffel, M. Niethammer, Robust and generalizable visual representation learning via random convolutions, arXiv preprint arXiv: 2007.13003 (2020)."},{"key":"10.1016\/j.inffus.2026.104470_bib0048","unstructured":"K. Zhou, Y. Yang, Y. Qiao, T. Xiang, Domain generalization with mixstyle, arXiv preprint arXiv: 2104.02008 (2021)."},{"issue":"9","key":"10.1016\/j.inffus.2026.104470_bib0049","doi-asserted-by":"crossref","first-page":"2763","DOI":"10.1109\/TMI.2023.3264513","article-title":"H2Former: an efficient hierarchical hybrid transformer for medical image segmentation","volume":"42","author":"He","year":"2023","journal-title":"IEEE Trans. Med. Imaging"},{"key":"10.1016\/j.inffus.2026.104470_bib0050","series-title":"Medical Image Computing and Computer Assisted Intervention \u2013 MICCAI 2024","first-page":"533","article-title":"Prompting segment anything model with domain-adaptive prototype for generalizable medical image segmentation","author":"Wei","year":"2024"},{"key":"10.1016\/j.inffus.2026.104470_bib0051","doi-asserted-by":"crossref","DOI":"10.1016\/j.neucom.2025.130120","article-title":"Multi-receptive field feature disentanglement with Distance-Aware Gaussian Brightness Augmentation for single-source domain generalization in medical image segmentation","volume":"638","author":"Wang","year":"2025","journal-title":"Neurocomputing"},{"key":"10.1016\/j.inffus.2026.104470_bib0052","doi-asserted-by":"crossref","DOI":"10.1016\/j.bspc.2024.106801","article-title":"Structure-aware single-source generalization with pixel-level disentanglement for joint optic disc and cup segmentation","volume":"99","author":"Jiang","year":"2025","journal-title":"Biomed. Signal Process. Control"},{"key":"10.1016\/j.inffus.2026.104470_bib0053","doi-asserted-by":"crossref","DOI":"10.1016\/j.bspc.2025.108814","article-title":"Frequency view feature interpolation and disentanglement for single-source domain generalization in retinal vessel segmentation","volume":"112","author":"Ma","year":"2026","journal-title":"Biomed. Signal Process. Control"},{"key":"10.1016\/j.inffus.2026.104470_bib0054","doi-asserted-by":"crossref","DOI":"10.1016\/j.bspc.2026.109828","article-title":"Disentangled contrastive learning with adaptive resampling for generalizable joint optic disc and cup segmentation","volume":"119","author":"Jiang","year":"2026","journal-title":"Biomed. Signal Process. Control"},{"key":"10.1016\/j.inffus.2026.104470_bib0055","unstructured":"J.-X. Jiang, W. Lei, Y. Wu, H. Wu, F. Li, Y. Xie, X. Zhang, Z. Wang, MFM-DA: instance-aware adaptor and hierarchical alignment for efficient domain adaptation in medical foundation models, arXiv preprint arXiv: 2503.00802 (2025)."}],"container-title":["Information Fusion"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S1566253526003490?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S1566253526003490?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2026,6,22]],"date-time":"2026-06-22T11:36:26Z","timestamp":1782128186000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S1566253526003490"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,11]]},"references-count":55,"alternative-id":["S1566253526003490"],"URL":"https:\/\/doi.org\/10.1016\/j.inffus.2026.104470","relation":{},"ISSN":["1566-2535"],"issn-type":[{"value":"1566-2535","type":"print"}],"subject":[],"published":{"date-parts":[[2026,11]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"Deepest-only integration of vision and textual semantics in expectation-maximization space for generalizable medical image segmentation","name":"articletitle","label":"Article Title"},{"value":"Information Fusion","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.inffus.2026.104470","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2026 Elsevier B.V. All rights are reserved, including those for text and data mining, AI training, and similar technologies.","name":"copyright","label":"Copyright"}],"article-number":"104470"}}