{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,11]],"date-time":"2025-09-11T19:36:09Z","timestamp":1757619369651,"version":"3.44.0"},"publisher-location":"Singapore","reference-count":33,"publisher":"Springer Nature Singapore","isbn-type":[{"type":"print","value":"9789819500352"},{"type":"electronic","value":"9789819500369"}],"license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-981-95-0036-9_39","type":"book-chapter","created":{"date-parts":[[2025,7,23]],"date-time":"2025-07-23T08:37:03Z","timestamp":1753259823000},"page":"460-471","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Multimodal Integration Based on Weak Alignment for Rectal Tumor Grading"],"prefix":"10.1007","author":[{"given":"Hongwu","family":"Liu","sequence":"first","affiliation":[]},{"given":"Shouhong","family":"Wan","sequence":"additional","affiliation":[]},{"given":"Chenyang","family":"Qiu","sequence":"additional","affiliation":[]},{"given":"Bingbing","family":"Zou","sequence":"additional","affiliation":[]},{"given":"Wanqin","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Risheng","family":"Xie","sequence":"additional","affiliation":[]},{"given":"Peiquan","family":"Jin","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,7,24]]},"reference":[{"key":"39_CR1","doi-asserted-by":"publisher","first-page":"423","DOI":"10.1016\/j.procs.2021.01.025","volume":"179","author":"D Sarwinda","year":"2021","unstructured":"Sarwinda, D., Paradisa, R., Bustamam, A., Anggia, P.: Deep learning in image classification using residual network (ResNet) variants for detection of colorectal cancer. Procedia Comput. Sci. 179, 423\u2013431 (2021)","journal-title":"Procedia Comput. Sci."},{"key":"39_CR2","doi-asserted-by":"crossref","unstructured":"Chauhan, T., Palivela, H. Tiwari, S.: Optimization and fine-tuning of DenseNet model for classification of COVID-19 cases in medical imaging. Int. J. Inform. Manage. Data Insights. 1, 100020 (2021)","DOI":"10.1016\/j.jjimei.2021.100020"},{"key":"39_CR3","doi-asserted-by":"publisher","first-page":"146533","DOI":"10.1109\/ACCESS.2019.2946000","volume":"7","author":"C Wang","year":"2019","unstructured":"Wang, C., Chen, D., Hao, L., et al.: Pulmonary image classification based on inception-v3 transfer learning model. IEEE Access 7, 146533\u2013146541 (2019)","journal-title":"IEEE Access"},{"key":"39_CR4","doi-asserted-by":"publisher","first-page":"69","DOI":"10.1186\/s12880-022-00793-7","volume":"22","author":"H Kim","year":"2022","unstructured":"Kim, H., Cosa-Linan, A., Santhanam, N., et al.: Transfer learning for medical image classification: a literature review. BMC Med. Imaging 22, 69 (2022)","journal-title":"BMC Med. Imaging"},{"key":"39_CR5","doi-asserted-by":"crossref","unstructured":"Peng, H., Schwartz, R. Smith, N.: PaLM: a hybrid parser and language model. ArXiv Preprint arXiv:1909.02134 (2019)","DOI":"10.18653\/v1\/D19-1376"},{"key":"39_CR6","unstructured":"Touvron, H., Lavril, T., Izacard, G., et al.: LLaMA: open and efficient foundation language models. ArXiv Preprint arXiv:2302.13971 (2023)"},{"key":"39_CR7","doi-asserted-by":"crossref","unstructured":"Yenduri, G., Ramalingam, M., Selvi, G., et al.: GPT (generative pre-trained transformer)\u2013a comprehensive review on enabling technologies, potential applications, emerging challenges, and future directions. IEEE Access 12, 54608 (2024)","DOI":"10.1109\/ACCESS.2024.3389497"},{"key":"39_CR8","unstructured":"Glm, T., Zeng, A., Xu, B., et al.: ChatGLM: a family of large language models from GLM-130B to GLM-4 all tools. ArXiv Preprint arXiv:2406.12793 (2024)"},{"key":"39_CR9","unstructured":"Singhal, K., Tu, T., Gottweis, J., et al.: Towards expert-level medical question answering with large language models. ArXiv Preprint arXiv:2305.09617 (2023)"},{"key":"39_CR10","doi-asserted-by":"crossref","unstructured":"Li, Y., Li, Z., Zhang, K., et al.: ChatDoctor: a medical chat model fine-tuned on a large language model meta-AI (LLaMA) using medical domain knowledge. Cureus. 15 (2023)","DOI":"10.7759\/cureus.40895"},{"key":"39_CR11","unstructured":"Han, T., Adams, L., Papaioannou, J., et al.: MedAlpaca\u2013an open-source collection of medical conversational AI models and training data. ArXiv Preprint arXiv:2304.08247 (2023)"},{"key":"39_CR12","unstructured":"Wu, C., Zhang, X., Zhang, Y., et al.: PMC-LLaMA: Further finetuning LLaMA on medical papers. ArXiv Preprint arXiv:2304.14454. 2(6) (2023)"},{"key":"39_CR13","unstructured":"Wang, H., Liu, C., Xi, N., et al.: HuaTuo: tuning llama model with Chinese medical knowledge. ArXiv Preprint arXiv:2304.06975 (2023)"},{"key":"39_CR14","unstructured":"Toma, A., Lawler, P., Ba, J., et al.: Clinical camel: an open-source expert-level medical language model with dialogue-based knowledge encoding. ArXiv Preprint arXiv:2305.12031, 1 (2023)"},{"key":"39_CR15","unstructured":"Radford, A., Kim, J., Hallacy, C., et al.: Learning transferable visual models from natural language supervision. In: International Conference on Machine Learning, pp. 8748\u20138763 (2021)"},{"key":"39_CR16","doi-asserted-by":"crossref","unstructured":"Zhai, X., Wang, X., Mustafa, B., et al.: Lit: zero-shot transfer with locked-image text tuning. In: Proceedings of The IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 18123\u201318133 (2022)","DOI":"10.1109\/CVPR52688.2022.01759"},{"key":"39_CR17","unstructured":"Li, J., Li, D., Savarese, S., Hoi, S.: Blip-2: bootstrapping language-image pre-training with frozen image encoders and large language models. In: International Conference on Machine Learning, pp. 19730\u201319742 (2023)"},{"key":"39_CR18","doi-asserted-by":"crossref","unstructured":"Liu, H., Son, K., Yang, J., et al.: Learning customized visual models with retrieval-augmented knowledge. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 15148\u201315158 (2023)","DOI":"10.1109\/CVPR52729.2023.01454"},{"key":"39_CR19","doi-asserted-by":"crossref","unstructured":"Wang, Z., Wu, Z., Agarwal, D., Sun, J.: Medclip: contrastive learning from unpaired medical images and text. ArXiv Preprint arXiv:2210.10163 (2022)","DOI":"10.18653\/v1\/2022.emnlp-main.256"},{"key":"39_CR20","doi-asserted-by":"crossref","unstructured":"Zhang, S., Xu, Y., Usuyama, N., et al.: A multimodal biomedical foundation model trained from fifteen million image\u2013text pairs. NEJM AI. 2(1), AIoa2400640 (2025)","DOI":"10.1056\/AIoa2400640"},{"key":"39_CR21","unstructured":"Alayrac, J., Donahue, J., Luc, P., et al.: Flamingo: a visual language model for few-shot learning. In: Advances in Neural Information Processing Systems, vol. 35, pp. 23716\u201323736 (2022)"},{"key":"39_CR22","unstructured":"Moor, M., Huang, Q., Wu, S., et al.: Med-Flamingo: a multimodal medical few-shot learner. In: Machine Learning for Health (ML4H), pp. 353\u2013367 (2023)"},{"key":"39_CR23","doi-asserted-by":"crossref","unstructured":"Ronneberger, O., Fischer, P., Brox, T.: U-net: convolutional networks for biomedical image segmentation. In: Medical Image Computing and Computer-assisted Intervention\u2013MICCAI 2015: 18th International Conference, Munich, Germany, October 5\u20139, 2015, Proceedings, Part III 18, pp. 234\u2013241 (2015)","DOI":"10.1007\/978-3-319-24574-4_28"},{"key":"39_CR24","doi-asserted-by":"crossref","unstructured":"Zhang, Y., Gao, J., Zhou, M., et al.: Text-guided foundation model adaptation for pathological image classification. In: International Conference on Medical Image Computing and Computer-Assisted Intervention, pp. 272\u2013282 (2023)","DOI":"10.1007\/978-3-031-43904-9_27"},{"key":"39_CR25","unstructured":"Zhang, Y., Jiang, H., Miura, Y., et al.: Contrastive learning of medical visual representations from paired images and text. In: Machine Learning for Healthcare Conference, pp. 2\u201325 (2022)"},{"key":"39_CR26","unstructured":"Dosovitskiy, A., Beyer, L., Kolesnikov, A., et al.: An image is worth 16 \u00d7 16 words: transformers for image recognition at scale. ArXiv Preprint arXiv:2010.11929 (2020)"},{"key":"39_CR27","doi-asserted-by":"crossref","unstructured":"Liu, Z., Lin, Y., Cao, Y., et al.: Swin transformer: hierarchical vision transformer using shifted windows. In: Proceedings of the IEEE\/CVF International Conference On Computer Vision, pp. 10012\u201310022 (2021)","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"39_CR28","doi-asserted-by":"crossref","unstructured":"He, K., Chen, X., Xie, S., et al.: Masked autoencoders are scalable vision learners. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 16000\u201316009 (2022)","DOI":"10.1109\/CVPR52688.2022.01553"},{"key":"39_CR29","doi-asserted-by":"crossref","unstructured":"Simon, K.: Colorectal cancer development and advances in screening. Clin. Interv. Aging. 11, 967\u2013976 (2016)","DOI":"10.2147\/CIA.S109285"},{"key":"39_CR30","doi-asserted-by":"crossref","unstructured":"Islam, R., Moushi, O.: GPT-4o: The Cutting-Edge Advancement in Multimodal LLM. Authorea Preprints (2024)","DOI":"10.36227\/techrxiv.171986596.65533294\/v1"},{"key":"39_CR31","doi-asserted-by":"crossref","unstructured":"Zhang, K., Zhou, R., Adhikarla, E., et al.: A generalist vision\u2013language foundation model for diverse biomedical tasks. Nature Med. 30, 1\u201313 (2024)","DOI":"10.1038\/s41591-024-03185-2"},{"key":"39_CR32","doi-asserted-by":"crossref","unstructured":"Hamamci, I.E., Er, S., Almas, F., et al.: Developing generalist foundation models from a multimodal dataset for 3D computed tomography. arXiv preprint arXiv:2403.17834 (2024)","DOI":"10.21203\/rs.3.rs-5271327\/v1"},{"issue":"1","key":"39_CR33","doi-asserted-by":"publisher","first-page":"824","DOI":"10.1038\/s41597-024-03658-6","volume":"11","author":"M Jian","year":"2024","unstructured":"Jian, M., Chen, H., Zhang, Z., et al.: A lung nodule dataset with histopathology-based cancer type annotation. Sci. Data. 11(1), 824 (2024)","journal-title":"Sci. Data."}],"container-title":["Lecture Notes in Computer Science","Advanced Intelligent Computing Technology and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-981-95-0036-9_39","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,7]],"date-time":"2025-09-07T19:49:48Z","timestamp":1757274588000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-981-95-0036-9_39"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"ISBN":["9789819500352","9789819500369"],"references-count":33,"URL":"https:\/\/doi.org\/10.1007\/978-981-95-0036-9_39","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"24 July 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"The authors have no competing interests to declare that are relevant to the content of this article.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Disclosure of Interests"}},{"value":"ICIC","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Intelligent Computing","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Ningbo","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"China","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2025","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"26 July 2025","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 July 2025","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"21","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"icic2025","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/www.ic-icc.cn\/icg\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}