{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,10]],"date-time":"2026-02-10T06:23:45Z","timestamp":1770704625442,"version":"3.49.0"},"reference-count":45,"publisher":"Springer Science and Business Media LLC","issue":"24","license":[{"start":{"date-parts":[[2024,1,15]],"date-time":"2024-01-15T00:00:00Z","timestamp":1705276800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,1,15]],"date-time":"2024-01-15T00:00:00Z","timestamp":1705276800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"DOI":"10.1007\/s11042-023-18027-5","type":"journal-article","created":{"date-parts":[[2024,1,15]],"date-time":"2024-01-15T08:02:34Z","timestamp":1705305754000},"page":"65221-65247","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":6,"title":["Multi-modal bilinear fusion with hybrid attention mechanism for multi-label skin lesion classification"],"prefix":"10.1007","volume":"83","author":[{"given":"Yun","family":"Wei","sequence":"first","affiliation":[]},{"given":"Lin","family":"Ji","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,1,15]]},"reference":[{"issue":"1","key":"18027_CR1","doi-asserted-by":"publisher","first-page":"7","DOI":"10.3322\/caac.21442","volume":"68","author":"RL Siegel","year":"2018","unstructured":"Siegel RL, Miller KD, Jemal A (2018) Cancer statistics, 2018. CA Cancer J Clin 68(1):7\u201330","journal-title":"CA Cancer J Clin"},{"issue":"5","key":"18027_CR2","doi-asserted-by":"publisher","first-page":"839","DOI":"10.1016\/S0190-9622(96)90041-9","volume":"34","author":"DS Rigel","year":"1996","unstructured":"Rigel DS, Friedman RJ, Kopf AW (1996) The incidence of malignant melanoma in the United States: issues as we approach the 21st century. J Am Acad Dermatol 34(5):839\u2013847. https:\/\/doi.org\/10.1016\/S0190-9622(96)90041-9","journal-title":"J Am Acad Dermatol"},{"issue":"10","key":"18027_CR3","doi-asserted-by":"publisher","first-page":"1081","DOI":"10.1001\/jamadermatol.2015.1187","volume":"151","author":"HW Rogers","year":"2015","unstructured":"Rogers HW, Weinstock MA, Feldman SR, Coldiron BM (2015) Incidence estimate of nonmelanoma skin cancer (keratinocyte carcinomas) in the US population, 2012. JAMA Dermatol 151(10):1081\u20131086","journal-title":"JAMA Dermatol"},{"issue":"5","key":"18027_CR4","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0000483","volume":"2","author":"C Massone","year":"2007","unstructured":"Massone C, Hofmann-Wellenhof R, Ahlgrimm-Siess V, Gabler G, Ebner C, Peter Soyer H (2007) Melanoma screening with cellular phones. PLoS ONE 2(5):e483","journal-title":"PLoS ONE"},{"issue":"7553","key":"18027_CR5","doi-asserted-by":"publisher","first-page":"436","DOI":"10.1038\/nature14539","volume":"521","author":"Y LeCun","year":"2015","unstructured":"LeCun Y, Bengio Y, Hinton G (2015) Deep learning. Nature 521(7553):436\u2013444","journal-title":"Nature"},{"key":"18027_CR6","doi-asserted-by":"publisher","first-page":"270","DOI":"10.1007\/978-3-662-45139-7_116","volume":"69","author":"C Barata","year":"2017","unstructured":"Barata C, Celebi ME, Marques JS (2017) Development of a clinically oriented system for melanoma diagnosis. Pattern Recogn 69:270\u2013285. https:\/\/doi.org\/10.1007\/978-3-662-45139-7_116","journal-title":"Pattern Recogn"},{"key":"18027_CR7","doi-asserted-by":"publisher","unstructured":"Duma S (2015) Dermoscopy of pigmented skin lesions. In: European Handbook of Dermatological Treatments. Springer, Berlin, Heidelberg, pp 1167\u20131177. https:\/\/doi.org\/10.1016\/j.jaad.2001.11.001","DOI":"10.1016\/j.jaad.2001.11.001"},{"key":"18027_CR8","doi-asserted-by":"crossref","unstructured":"Argenziano G, Catrical\u00e0 C, Ardigo M, Buccini P, De Simone P, Eibenschutz L \u2026 Zalaudek I (2011) Dermoscopy of patients with multiple nevi: Improved management recommendations using a comparative diagnostic approach. Arch Dermatol 147(1):46\u201349","DOI":"10.1001\/archdermatol.2010.389"},{"issue":"1","key":"18027_CR9","doi-asserted-by":"publisher","first-page":"86","DOI":"10.1016\/j.patcog.2012.07.027","volume":"46","author":"Q Abbas","year":"2013","unstructured":"Abbas Q, Celebi ME, Serrano C, Garcia IF, Ma G (2013) Pattern classification of dermoscopy images: a perceptually uniform model. Pattern Recogn 46(1):86\u201397. https:\/\/doi.org\/10.1016\/j.patcog.2012.07.027","journal-title":"Pattern Recogn"},{"issue":"6","key":"18027_CR10","doi-asserted-by":"publisher","first-page":"1052","DOI":"10.1016\/j.patcog.2008.07.011","volume":"42","author":"C Serrano","year":"2009","unstructured":"Serrano C, Acha B (2009) Pattern analysis of dermoscopic images based on Markov random fields. Pattern Recognit 42(6):1052\u20131057","journal-title":"Pattern Recognit"},{"issue":"9","key":"18027_CR11","doi-asserted-by":"publisher","first-page":"2065","DOI":"10.1109\/TBME.2017.2712771","volume":"64","author":"L Bi","year":"2017","unstructured":"Bi L, Kim J, Ahn E, Kumar A, Fulham M, Feng D (2017) Dermoscopic image segmentation via multistage fully convolutional networks. IEEE Trans Biomed Eng 64(9):2065\u20132074","journal-title":"IEEE Trans Biomed Eng"},{"issue":"9","key":"18027_CR12","doi-asserted-by":"publisher","first-page":"1892","DOI":"10.1016\/j.patcog.2010.10.024","volume":"44","author":"K Bunte","year":"2011","unstructured":"Bunte K, Biehl M, Jonkman MF, Petkov N (2011) Learning effective color features for content based image retrieval in dermatology. Pattern Recogn 44(9):1892\u20131902. https:\/\/doi.org\/10.1016\/j.patcog.2010.10.024","journal-title":"Pattern Recogn"},{"issue":"3","key":"18027_CR13","doi-asserted-by":"publisher","first-page":"1146","DOI":"10.1109\/ICIP.2014.7025716","volume":"19","author":"C Barata","year":"2014","unstructured":"Barata C, Celebi ME, Marques JS (2014) Improving dermoscopy image classification using color constancy. IEEE J Biomed Health Inform 19(3):1146\u20131152. https:\/\/doi.org\/10.1109\/ICIP.2014.7025716","journal-title":"IEEE J Biomed Health Inform"},{"issue":"5","key":"18027_CR14","doi-asserted-by":"publisher","first-page":"1137","DOI":"10.1109\/TMI.2014.2305769","volume":"33","author":"A Saez","year":"2014","unstructured":"Saez A, Serrano C, Acha B (2014) Model-based classification methods of global patterns in dermoscopic images. IEEE Trans Med Imaging 33(5):1137\u20131147. https:\/\/doi.org\/10.1109\/TMI.2014.2305769","journal-title":"IEEE Trans Med Imaging"},{"issue":"1","key":"18027_CR15","doi-asserted-by":"publisher","first-page":"98","DOI":"10.1016\/j.patcog.2012.07.001","volume":"46","author":"L Ma","year":"2013","unstructured":"Ma L, Staunton RC (2013) Analysis of the contour structural irregularity of skin lesions using wavelet decomposition. Pattern Recogn 46(1):98\u2013106","journal-title":"Pattern Recogn"},{"key":"18027_CR16","unstructured":"Zhang J, Cui L, Gouza FB (2018) SEGEN: sample-ensemble genetic evolutional network model. arXiv preprint arXiv:1803.08631"},{"key":"18027_CR17","doi-asserted-by":"crossref","unstructured":"Liu D, Cui Y, Tan W, Chen Y (2021) Sg-net: spatial granularity network for one-stage video instance segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 9816\u20139825","DOI":"10.1109\/CVPR46437.2021.00969"},{"key":"18027_CR18","unstructured":"Liang J, Zhou T, Liu D, Wang W (2023) CLUSTSEG: Clustering for Universal Segmentation. arXiv preprint arXiv:2305.02187"},{"issue":"9","key":"18027_CR19","doi-asserted-by":"publisher","first-page":"2092","DOI":"10.1109\/TMI.2019.2893944","volume":"38","author":"J Zhang","year":"2019","unstructured":"Zhang J, Xie Y, Xia Y, Shen C (2019) Attention residual learning for skin lesion classification. IEEE Trans Med Imaging 38(9):2092\u20132103","journal-title":"IEEE Trans Med Imaging"},{"key":"18027_CR20","doi-asserted-by":"publisher","first-page":"7160","DOI":"10.1109\/ACCESS.2019.2962812","volume":"8","author":"AA Adegun","year":"2019","unstructured":"Adegun AA, Viriri S (2019) Deep learning-based system for automatic melanoma detection. IEEE Access 8:7160\u20137172","journal-title":"IEEE Access"},{"key":"18027_CR21","first-page":"12826","volume":"35","author":"W Wang","year":"2022","unstructured":"Wang W, Liang J, Liu D (2022) Learning equivariant segmentation with instance-unique querying. Adv Neural Inf Process Syst 35:12826\u201312840","journal-title":"Adv Neural Inf Process Syst"},{"key":"18027_CR22","doi-asserted-by":"publisher","unstructured":"Harangi B (2017) Skin lesion detection based on an ensemble of deep convolutional neural network. arXiv preprint arXiv:1705.03360. https:\/\/doi.org\/10.1016\/j.jbi.2018.08.006","DOI":"10.1016\/j.jbi.2018.08.006"},{"issue":"11","key":"18027_CR23","doi-asserted-by":"publisher","first-page":"1261","DOI":"10.1111\/exd.13777","volume":"27","author":"J Yap","year":"2018","unstructured":"Yap J, Yolland W, Tschandl P (2018) Multimodal skin lesion classification using deep learning. Exp Dermatol 27(11):1261\u20131267","journal-title":"Exp Dermatol"},{"key":"18027_CR24","doi-asserted-by":"publisher","unstructured":"Li W, Zhuang J, Wang R, Zhang J, Zheng WS (2020) Fusing metadata and dermoscopy images for skin disease diagnosis. In: 2020 IEEE 17th international symposium on biomedical imaging (ISBI), pp 1996\u20132000. IEEE. https:\/\/doi.org\/10.1109\/ISBI45749.2020.9098645","DOI":"10.1109\/ISBI45749.2020.9098645"},{"issue":"2","key":"18027_CR25","doi-asserted-by":"publisher","first-page":"538","DOI":"10.1109\/JBHI.2018.2824327","volume":"23","author":"J Kawahara","year":"2018","unstructured":"Kawahara J, Daneshvar S, Argenziano G, Hamarneh G (2018) Seven-point checklist and skin lesion classification using multitask multimodal neural nets. IEEE J Biomed Health Inform 23(2):538\u2013546","journal-title":"IEEE J Biomed Health Inform"},{"key":"18027_CR26","doi-asserted-by":"publisher","DOI":"10.1016\/j.media.2021.102307","volume":"76","author":"P Tang","year":"2022","unstructured":"Tang P, Yan X, Nan Y, Xiang S, Krammer S, Lasser T (2022) FusionM4Net: a multi-stage multi-modal learning algorithm for multi-label skin lesion classification. Med Image Anal 76:102307","journal-title":"Med Image Anal"},{"key":"18027_CR27","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2020.107502","volume":"107","author":"L Bi","year":"2020","unstructured":"Bi L, Feng DD, Fulham M, Kim J (2020) Multi-label classification of multi-modality skin lesion via hyper-connected convolutional neural network. Pattern Recogn 107:107502. https:\/\/doi.org\/10.1016\/j.patcog.2020.107502","journal-title":"Pattern Recogn"},{"key":"18027_CR28","doi-asserted-by":"crossref","unstructured":"Ge Z, Demyanov S, Chakravorty R, Bowling A, Garnavi R (2017) Skin disease recognition using deep saliency features and multimodal learning of dermoscopy and clinical images. In: Medical Image Computing and Computer Assisted Intervention\u2212 MICCAI 2017: 20th International Conference, Quebec City, QC, Canada, September 11\u201313, 2017, Proceedings, Part III 20. Springer International Publishing, pp 250\u2013258","DOI":"10.1007\/978-3-319-66179-7_29"},{"key":"18027_CR29","doi-asserted-by":"crossref","unstructured":"Wu Y, Lariba AC, Chen H, Zhao H (2022) Skin lesion classification based on deep convolutional neural network. In: 2022 IEEE 4th International Conference on Power, Intelligent Computing and Systems (ICPICS). IEEE, pp 376\u2013380","DOI":"10.1109\/ICPICS55264.2022.9873756"},{"key":"18027_CR30","doi-asserted-by":"crossref","unstructured":"Bhattacharya I, Seetharaman A, Kunder C, Shao W, Chen LC, Soerensen SJ \u2026 Rusu M (2022) Selective identification and localization of indolent and aggressive prostate cancers via CorrSigNIA: an MRI-pathology correlation and deep learning framework. Med Image Anal 75:102288","DOI":"10.1016\/j.media.2021.102288"},{"issue":"2","key":"18027_CR31","doi-asserted-by":"publisher","first-page":"257","DOI":"10.1162\/NECO_a_00801","volume":"28","author":"S Chandar","year":"2016","unstructured":"Chandar S, Khapra MM, Larochelle H, Ravindran B (2016) Correlational neural networks. Neural Comput 28(2):257\u2013285","journal-title":"Neural Comput"},{"issue":"2","key":"18027_CR32","doi-asserted-by":"publisher","first-page":"529","DOI":"10.1016\/j.bbe.2022.02.009","volume":"42","author":"Y Guo","year":"2022","unstructured":"Guo Y, Wang Y, Yang H, Zhang J, Sun Q (2022) Dual-attention EfficientNet based on multi-view feature fusion for cervical squamous intraepithelial lesions diagnosis. Biocybern Biomed Eng 42(2):529\u2013542","journal-title":"Biocybern Biomed Eng"},{"key":"18027_CR33","doi-asserted-by":"crossref","unstructured":"Roy AG, Navab N, Wachinger C (2018) Concurrent spatial and channel \u2018squeeze & excitation\u2019in fully convolutional networks. In: Medical Image Computing and Computer Assisted Intervention\u2013MICCAI 2018: 21st International Conference, Granada, Spain, September 16\u201320, 2018, Proceedings, Part I. Springer International Publishing, pp 421\u2013429","DOI":"10.1007\/978-3-030-00928-1_48"},{"key":"18027_CR34","doi-asserted-by":"publisher","DOI":"10.1016\/j.bspc.2021.102700","volume":"68","author":"L Yan","year":"2021","unstructured":"Yan L, Li S, Guo Y, Ren P, Song H, Yang J, Shen X (2021) Multi-state colposcopy image fusion for cervical precancerous lesion diagnosis using BF-CNN. Biomed Signal Process Control 68:102700","journal-title":"Biomed Signal Process Control"},{"key":"18027_CR35","doi-asserted-by":"crossref","unstructured":"Yu Z, Yu J, Fan J, Tao D (2017) Multi-modal factorized bilinear pooling with co-attention learning for visual question answering. In: Proceedings of the IEEE international conference on computer vision, pp 1821\u20131830","DOI":"10.1109\/ICCV.2017.202"},{"key":"18027_CR36","unstructured":"Ruder S (2016) An overview of gradient descent optimization algorithms. arXiv preprint arXiv:1609.04747"},{"key":"18027_CR37","doi-asserted-by":"crossref","unstructured":"Afroze S, Hossain MR, Hoque MM, Dewan MAA (2023) An empirical framework for detecting speaking modes using ensemble classifier. Multimed Tools Appl:1\u201334","DOI":"10.1007\/s11042-023-15254-8"},{"key":"18027_CR38","unstructured":"Kingma DP, Adam BJ (2014) A method for stochastic optimization. arXiv e-prints. arXiv preprint arXiv:1412.6980, 1412"},{"key":"18027_CR39","unstructured":"Ngiam J, Khosla A, Kim M, Nam J, Lee H, Ng AY (2011) Multimodal deep learning. In: Proceedings of the 28th international conference on machine learning (ICML-11), pp 689\u2013696"},{"key":"18027_CR40","doi-asserted-by":"crossref","unstructured":"Wang W, Wang Y, Liu D, Hou W, Zhou T, Ji Z (2022) GeneSegNet: a deep learning framework for cell segmentation by integrating gene expression and imaging. bioRxiv, 2022-12","DOI":"10.1101\/2022.12.13.520283"},{"key":"18027_CR41","unstructured":"Wang W, Han C, Zhou T, Liu D (2022) Visual recognition with deep nearest centroids. arXiv preprint arXiv:2209.07383"},{"key":"18027_CR42","doi-asserted-by":"crossref","unstructured":"Venugopal V, Raj NI, Nath MK, Stephen N (2023) A deep neural network using modified EfficientNet for skin cancer detection in dermoscopic images. Decis Anal J:100278","DOI":"10.1016\/j.dajour.2023.100278"},{"key":"18027_CR43","doi-asserted-by":"crossref","unstructured":"Chattopadhay A, Sarkar A, Howlader P, Balasubramanian VN (2018) Grad-cam++: generalized gradient-based visual explanations for deep convolutional networks. In: 2018 IEEE winter conference on applications of computer vision (WACV). IEEE, pp 839\u2013847","DOI":"10.1109\/WACV.2018.00097"},{"key":"18027_CR44","doi-asserted-by":"publisher","DOI":"10.1016\/j.bspc.2022.103549","volume":"74","author":"Z Wei","year":"2022","unstructured":"Wei Z, Li Q, Song H (2022) Dual attention based network for skin lesion classification with auxiliary learning. Biomed Signal Process Control 74:103549","journal-title":"Biomed Signal Process Control"},{"key":"18027_CR45","doi-asserted-by":"crossref","unstructured":"Bayoudh K, Knani R, Hamdaoui F, Mtibaa A (2021) A survey on deep multimodal learning for computer vision: advances, trends, applications, and datasets. Vis Comput:1\u201332","DOI":"10.1007\/s00371-021-02166-7"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-023-18027-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-023-18027-5\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-023-18027-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,7,8]],"date-time":"2024-07-08T17:43:45Z","timestamp":1720460625000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-023-18027-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,1,15]]},"references-count":45,"journal-issue":{"issue":"24","published-online":{"date-parts":[[2024,7]]}},"alternative-id":["18027"],"URL":"https:\/\/doi.org\/10.1007\/s11042-023-18027-5","relation":{},"ISSN":["1573-7721"],"issn-type":[{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,1,15]]},"assertion":[{"value":"2 January 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 September 2023","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"26 December 2023","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 January 2024","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}]}}