{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,18]],"date-time":"2026-02-18T13:10:19Z","timestamp":1771420219850,"version":"3.50.1"},"reference-count":41,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T00:00:00Z","timestamp":1769904000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T00:00:00Z","timestamp":1769904000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T00:00:00Z","timestamp":1769904000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-017"},{"start":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T00:00:00Z","timestamp":1769904000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"},{"start":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T00:00:00Z","timestamp":1769904000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-012"},{"start":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T00:00:00Z","timestamp":1769904000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T00:00:00Z","timestamp":1769904000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-004"}],"funder":[{"DOI":"10.13039\/501100013365","name":"West China Hospital, Sichuan University","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100013365","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["clinicalkey.com","clinicalkey.com.au","clinicalkey.es","clinicalkey.fr","clinicalkey.jp","elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Computerized Medical Imaging and Graphics"],"published-print":{"date-parts":[[2026,2]]},"DOI":"10.1016\/j.compmedimag.2026.102706","type":"journal-article","created":{"date-parts":[[2026,1,11]],"date-time":"2026-01-11T15:11:04Z","timestamp":1768144264000},"page":"102706","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":0,"special_numbering":"C","title":["ThyFusionNet: A CNN\u2013transformer framework with spatial aware sparse attention for multi modal thyroid disease diagnosis"],"prefix":"10.1016","volume":"128","author":[{"given":"Bing","family":"Yang","sequence":"first","affiliation":[]},{"given":"Jun","family":"Li","sequence":"additional","affiliation":[]},{"given":"Junyang","family":"Chen","sequence":"additional","affiliation":[]},{"given":"Yutong","family":"Huang","sequence":"additional","affiliation":[]},{"given":"Nanbo","family":"Xu","sequence":"additional","affiliation":[]},{"given":"Qiurui","family":"Liu","sequence":"additional","affiliation":[]},{"given":"Jiaxin","family":"Liu","sequence":"additional","affiliation":[]},{"given":"Yuheng","family":"Zhou","sequence":"additional","affiliation":[]}],"member":"78","reference":[{"key":"10.1016\/j.compmedimag.2026.102706_bib1","doi-asserted-by":"crossref","first-page":"1","DOI":"10.55969\/paradigmplus.v4n1a1","article-title":"Continuous eye disease severity evaluation system using siamese neural networks","volume":"4","author":"Abdulraheem","year":"2023","journal-title":"ParadigmPlus"},{"key":"10.1016\/j.compmedimag.2026.102706_bib2","doi-asserted-by":"crossref","first-page":"51","DOI":"10.19101\/IJACR.2021.1152001","article-title":"Multi-classification of Alzheimer disease on magnetic resonance images (MRI) using deep convolutional neural network (DCNN) approaches","volume":"11","author":"Ajagbe","year":"2021","journal-title":"Int. J. Adv. Comput. Res."},{"key":"10.1016\/j.compmedimag.2026.102706_bib3","doi-asserted-by":"crossref","first-page":"3675","DOI":"10.1007\/s00371-023-02984-x","article-title":"Sthy-net: a feature fusion-enhanced dense-branched modules network for small thyroid nodule classification from ultrasound images","volume":"39","author":"Al-Jebrni","year":"2023","journal-title":"Vis. Comput."},{"key":"10.1016\/j.compmedimag.2026.102706_bib4","unstructured":"Alom, M.Z., T.M. Taha, C. Yakopcic, S. Westberg, P. Sidike, M.S. Nasrin, B.C. Van Esesn, A.A.S. Awwal, and V.K. Asari. 2018. The history began from alexnet: A comprehensive survey on deep learning approaches. arXiv preprint arXiv:1803.01164."},{"key":"10.1016\/j.compmedimag.2026.102706_bib5","doi-asserted-by":"crossref","unstructured":"Al-Qizwini, M., I. Barjasteh, H. Al-Qassab, and H. Radha. Year 1. Deep learning algorithm for autonomous driving using googlenet. Proc. 2017 IEEE intelligent vehicles symposium (IV).","DOI":"10.1109\/IVS.2017.7995703"},{"key":"10.1016\/j.compmedimag.2026.102706_bib6","article-title":"Signature verification using a siamese time delay neural network","volume":"6","author":"Bromley","year":"1993","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"10.1016\/j.compmedimag.2026.102706_bib7","doi-asserted-by":"crossref","unstructured":"Caron, M., Touvron, H., Misra, I., J\u00e9gou, H., Mairal, J., Bojanowski, P., Joulin, A., 2021. Emerging properties in self-supervised vision transformers, Proceedings of the IEEE\/CVF international conference on computer vision. pp. 9650-9660.","DOI":"10.1109\/ICCV48922.2021.00951"},{"key":"10.1016\/j.compmedimag.2026.102706_bib8","series-title":"Simclr: A simple framework for contrastive learning of visual representations, International Conference on Learning Representations","author":"Chen","year":"2020"},{"key":"10.1016\/j.compmedimag.2026.102706_bib9","doi-asserted-by":"crossref","unstructured":"Chen, P.-C., H. Tsai, S. Bhojanapalli, H.W. Chung, Y.-W. Chang, and C.-S. Ferng. 2021. A simple and effective positional encoding for transformers. arXiv preprint arXiv:2104.08698.","DOI":"10.18653\/v1\/2021.emnlp-main.236"},{"key":"10.1016\/j.compmedimag.2026.102706_bib10","doi-asserted-by":"crossref","first-page":"1384","DOI":"10.3390\/diagnostics11081384","article-title":"Transmed: Transformers advance multi-modal medical image classification","volume":"11","author":"Dai","year":"2021","journal-title":"Diagnostics"},{"key":"10.1016\/j.compmedimag.2026.102706_bib11","unstructured":"Dosovitskiy, A., L. Beyer, A. Kolesnikov, D. Weissenborn, X. Zhai, T. Unterthiner, M. Dehghani, M. Minderer, G. Heigold, and S. Gelly. 2020. An image is worth 16x16 words: Transformers for image recognition at scale. arXiv preprint arXiv:2010.11929."},{"key":"10.1016\/j.compmedimag.2026.102706_bib12","unstructured":"Gower, R.M., Loizou, N., Qian, X., Sailanbayev, A., Shulgin, E., Richt\u00e1rik, P., 2019. SGD: General analysis and improved rates, International conference on machine learning. PMLR, pp. 5200-5209."},{"key":"10.1016\/j.compmedimag.2026.102706_bib13","doi-asserted-by":"crossref","unstructured":"Han, D., Pan, X., Han, Y., Song, S., Huang, G., 2023. Flatten transformer: Vision transformer using focused linear attention, Proceedings of the IEEE\/CVF international conference on computer vision. pp. 5961-5971.","DOI":"10.1109\/ICCV51070.2023.00548"},{"key":"10.1016\/j.compmedimag.2026.102706_bib14","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J., 2016. Deep residual learning for image recognition, Proceedings of the IEEE conference on computer vision and pattern recognition. pp. 770-778.","DOI":"10.1109\/CVPR.2016.90"},{"key":"10.1016\/j.compmedimag.2026.102706_bib15","unstructured":"Iandola, F., M. Moskewicz, S. Karayev, R. Girshick, T. Darrell, and K. Keutzer. 2014. Densenet: Implementing efficient convnet descriptor pyramids. arXiv preprint arXiv:1404.1869."},{"key":"10.1016\/j.compmedimag.2026.102706_bib16","doi-asserted-by":"crossref","unstructured":"Kawahara, J., and G. Hamarneh. 2016. Multi-resolution-tract CNN with hybrid pretrained and skin-lesion trained layers. Pages 164-171.","DOI":"10.1007\/978-3-319-47157-0_20"},{"key":"10.1016\/j.compmedimag.2026.102706_bib17","doi-asserted-by":"crossref","DOI":"10.1002\/aisy.202200365","article-title":"Multimodal neural network for recurrence prediction of papillary thyroid carcinoma","volume":"5","author":"Kim","year":"2023","journal-title":"Adv. Intell. Syst."},{"key":"10.1016\/j.compmedimag.2026.102706_bib18","unstructured":"Kingma, D.P. 2014. Adam: A method for stochastic optimization. arXiv preprint arXiv:1412.6980."},{"key":"10.1016\/j.compmedimag.2026.102706_bib19","doi-asserted-by":"crossref","unstructured":"Koonce, B. 2021. MobileNetV3. Pages 125-144 in Convolutional neural networks with swift for tensorflow: image recognition and dataset categorizationSpringer.","DOI":"10.1007\/978-1-4842-6168-2_11"},{"key":"10.1016\/j.compmedimag.2026.102706_bib20","doi-asserted-by":"crossref","unstructured":"Li, S., Y. Liu, X. Sui, C. Chen, G. Tjio, D.S.W. Ting, and R.S.M. Goh. 2019. Multi-instance multi-scale CNN for medical image classification. Pages 531-539.","DOI":"10.1007\/978-3-030-32251-9_58"},{"key":"10.1016\/j.compmedimag.2026.102706_bib21","doi-asserted-by":"crossref","unstructured":"Liu, Z., Lin, Y., Cao, Y., Hu, H., Wei, Y., Zhang, Z., Lin, S., Guo, B., 2021. Swin transformer: Hierarchical vision transformer using shifted windows, Proceedings of the IEEE\/CVF international conference on computer vision. pp. 10012-10022.","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"10.1016\/j.compmedimag.2026.102706_bib22","doi-asserted-by":"crossref","DOI":"10.1016\/j.compbiomed.2023.106791","article-title":"MedViT: a robust vision transformer for generalized medical image classification","volume":"157","author":"Manzari","year":"2023","journal-title":"Comput. Biol. Med."},{"key":"10.1016\/j.compmedimag.2026.102706_bib23","doi-asserted-by":"crossref","first-page":"2202","DOI":"10.3390\/s21062202","article-title":"Hepatocellular carcinoma automatic diagnosis within CEUS and B-mode ultrasound images using advanced machine learning methods","volume":"21","author":"Mitrea","year":"2021","journal-title":"Sensors"},{"key":"10.1016\/j.compmedimag.2026.102706_bib24","doi-asserted-by":"crossref","unstructured":"Naglah, A., F. Khalifa, R. Khaled, A. El-Baz, and et al. 2021. Thyroid cancer computer-aided diagnosis system using MRI-based multi-input CNN model. Pages 1691-1694.","DOI":"10.1109\/ISBI48211.2021.9433841"},{"key":"10.1016\/j.compmedimag.2026.102706_bib25","unstructured":"Oord, A. v d 1807 van den, Li, Y., & Vinyals, O. (2019). Representation Learning with Contrastive Predictive Coding (No. arXiv: 1807.03748). arXiv. 10.48550. arXiv."},{"key":"10.1016\/j.compmedimag.2026.102706_bib26","unstructured":"Powers, D.M. 2020. Evaluation: from precision, recall and F-measure to ROC, informedness, markedness and correlation. arXiv preprint arXiv:2010.16061."},{"key":"10.1016\/j.compmedimag.2026.102706_bib27","first-page":"8748","article-title":"Learning transferable visual models from natural language supervision, International conference on machine learning","author":"Radford","year":"2021","journal-title":"PmLR"},{"key":"10.1016\/j.compmedimag.2026.102706_bib28","doi-asserted-by":"crossref","unstructured":"Ronneberger, O., P. Fischer, and T. Brox. 2015. U-net: Convolutional networks for biomedical image segmentation. Pages 234-241.","DOI":"10.1007\/978-3-319-24574-4_28"},{"key":"10.1016\/j.compmedimag.2026.102706_bib29","series-title":"Mobilenetv2: Inverted residuals and linear bottlenecks","first-page":"4510","author":"Sandler","year":"2018"},{"key":"10.1016\/j.compmedimag.2026.102706_bib30","series-title":"Computer-based medical consultations: MYCIN","author":"Shortliffe","year":"2012"},{"key":"10.1016\/j.compmedimag.2026.102706_bib31","unstructured":"Simonyan, K., and A. Zisserman. 2014. Very deep convolutional networks for large-scale image recognition. arXiv preprint arXiv:1409.1556."},{"key":"10.1016\/j.compmedimag.2026.102706_bib32","first-page":"209","article-title":"Global cancer statistics 2020: GLOBOCAN estimates of incidence and mortality worldwide for 36 cancers in 185 countries","volume":"71","author":"Sung","year":"2021","journal-title":"CA a cancer journal clinicians"},{"key":"10.1016\/j.compmedimag.2026.102706_bib33","doi-asserted-by":"crossref","first-page":"2870","DOI":"10.1109\/JBHI.2020.2977013","article-title":"GP-CNN-DTEL: global-part CNN model with data-transformed ensemble learning for skin lesion classification","volume":"24","author":"Tang","year":"2020","journal-title":"IEEE J. Biomed. Health Inform."},{"key":"10.1016\/j.compmedimag.2026.102706_bib34","series-title":"Maxvit: Multi-axis vision transformer, European conference on computer vision","first-page":"459","author":"Tu","year":"2022"},{"key":"10.1016\/j.compmedimag.2026.102706_bib35","doi-asserted-by":"crossref","unstructured":"Tu, Z., H. Talebi, H. Zhang, F. Yang, P. Milanfar, A. Bovik, and Y. Li. 2022b. Maxvit: Multi-axis vision transformer. Pages 459-479.","DOI":"10.1007\/978-3-031-20053-3_27"},{"key":"10.1016\/j.compmedimag.2026.102706_bib36","article-title":"Attention is all you need","volume":"30","author":"Vaswani","year":"2017","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"10.1016\/j.compmedimag.2026.102706_bib37","doi-asserted-by":"crossref","DOI":"10.1016\/j.patcog.2019.107075","article-title":"Learning visual relationship and context-aware attention for image captioning","volume":"98","author":"Wang","year":"2020","journal-title":"Pattern Recognit."},{"key":"10.1016\/j.compmedimag.2026.102706_bib38","doi-asserted-by":"crossref","unstructured":"Woo, S., Debnath, S., Hu, R., Chen, X., Liu, Z., Kweon, I.S., Xie, S., 2023. Convnext v2: Co-designing and scaling convnets with masked autoencoders, Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition. pp. 16133-16142.","DOI":"10.1109\/CVPR52729.2023.01548"},{"key":"10.1016\/j.compmedimag.2026.102706_bib39","doi-asserted-by":"crossref","first-page":"9562","DOI":"10.1109\/TNNLS.2022.3158966","article-title":"RegNet: self-regulated network for image classification","volume":"34","author":"Xu","year":"2022","journal-title":"IEEE Trans. Neural Netw. Learn. Syst."},{"key":"10.1016\/j.compmedimag.2026.102706_bib40","doi-asserted-by":"crossref","first-page":"9194","DOI":"10.1109\/TCYB.2021.3061147","article-title":"Two-stage selective ensemble of CNN via deep tree training for medical image classification","volume":"52","author":"Yang","year":"2021","journal-title":"IEEE Trans. Cybern."},{"key":"10.1016\/j.compmedimag.2026.102706_bib41","doi-asserted-by":"crossref","DOI":"10.1016\/j.neucom.2023.126577","article-title":"Class attention to regions of lesion for imbalanced medical image recognition","volume":"555","author":"Zhuang","year":"2023","journal-title":"Neurocomputing"}],"container-title":["Computerized Medical Imaging and Graphics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0895611126000091?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0895611126000091?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2026,2,18]],"date-time":"2026-02-18T12:33:08Z","timestamp":1771417988000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0895611126000091"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,2]]},"references-count":41,"alternative-id":["S0895611126000091"],"URL":"https:\/\/doi.org\/10.1016\/j.compmedimag.2026.102706","relation":{},"ISSN":["0895-6111"],"issn-type":[{"value":"0895-6111","type":"print"}],"subject":[],"published":{"date-parts":[[2026,2]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"ThyFusionNet: A CNN\u2013transformer framework with spatial aware sparse attention for multi modal thyroid disease diagnosis","name":"articletitle","label":"Article Title"},{"value":"Computerized Medical Imaging and Graphics","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.compmedimag.2026.102706","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2026 Elsevier Ltd. All rights are reserved, including those for text and data mining, AI training, and similar technologies.","name":"copyright","label":"Copyright"}],"article-number":"102706"}}