{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,11]],"date-time":"2025-09-11T19:30:41Z","timestamp":1757619041163,"version":"3.44.0"},"publisher-location":"Singapore","reference-count":19,"publisher":"Springer Nature Singapore","isbn-type":[{"type":"print","value":"9789819500260"},{"type":"electronic","value":"9789819500277"}],"license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-981-95-0027-7_10","type":"book-chapter","created":{"date-parts":[[2025,7,16]],"date-time":"2025-07-16T14:15:45Z","timestamp":1752675345000},"page":"104-116","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Anatomy-Aware Mixture of Experts for Medical Vision-Language Pre-training"],"prefix":"10.1007","author":[{"given":"Kun","family":"Shi","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Haiwei","family":"Pan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kejia","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,7,17]]},"reference":[{"key":"10_CR1","first-page":"33536","volume":"35","author":"F Wang","year":"2022","unstructured":"Wang, F., Zhou, Y., Wang, S., Vardhanabhuti, V., Yu, L.: Multi-granularity cross-modal alignment for generalized medical visual representation learning. Adv. Neural. Inf. Process. Syst. 35, 33536\u201333549 (2022)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"10_CR2","doi-asserted-by":"crossref","unstructured":"Huang, S.C., Shen, L., Lungren, M.P., Yeung, S.: GLoRIA: a multimodal global-local representation learning framework for label-efficient medical image recognition. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 3942\u20133951 (2021)","DOI":"10.1109\/ICCV48922.2021.00391"},{"key":"10_CR3","unstructured":"Zhang, Y., Jiang, H., Miura, Y., Manning, C.D., Langlotz, C.P.: Contrastive learning of medical visual representations from paired images and text. In: Machine Learning for Healthcare Conference, pp. 2\u201325. PMLR (2022)"},{"key":"10_CR4","unstructured":"Yang, J., Su, B., Zhao, W.X., Wen, J.R.: Unlocking the Power of Spatial and Temporal Information in Medical Multimodal Pre-training. arXiv preprint arXiv:2405.19654 (2024)"},{"key":"10_CR5","doi-asserted-by":"crossref","unstructured":"Bannur, S., et al.: Learning to exploit temporal structure for biomedical vision-language processing. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 15016\u201315027 (2023)","DOI":"10.1109\/CVPR52729.2023.01442"},{"issue":"7956","key":"10_CR6","doi-asserted-by":"publisher","first-page":"259","DOI":"10.1038\/s41586-023-05881-4","volume":"616","author":"M Moor","year":"2023","unstructured":"Moor, M., et al.: Foundation models for generalist medical artificial intelligence. Nature 616(7956), 259\u2013265 (2023)","journal-title":"Nature"},{"key":"10_CR7","doi-asserted-by":"crossref","unstructured":"Wang, Z., Wu, Z., Agarwal, D., Sun, J.: MedCLIP: contrastive learning from unpaired medical images and text. In: Proceedings of the Conference on Empirical Methods in Natural Language Processing. Conference on Empirical Methods in Natural Language Processing. vol. 2022, p. 3876 (2022)","DOI":"10.18653\/v1\/2022.emnlp-main.256"},{"key":"10_CR8","doi-asserted-by":"crossref","unstructured":"Wu, C., Zhang, X., Zhang, Y., Wang, Y., Xie, W.: MedKLIP: medical knowledge enhanced language-image pre-training for x-ray diagnosis. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 21372\u201321383 (2023)","DOI":"10.1109\/ICCV51070.2023.01954"},{"key":"10_CR9","unstructured":"Zhou, H.Y., Lian, C., Wang, L., Yu, Y.: Advancing Radiograph Representation Learning with Masked Record Modeling. arXiv preprint arXiv:2301.13155 (2023)"},{"key":"10_CR10","doi-asserted-by":"crossref","unstructured":"Boecking, B., et al.: Making the most of text semantics to improve biomedical vision\u2013language processing. In: European Conference on Computer Vision, pp. 1\u201321. Springer (2022)","DOI":"10.1007\/978-3-031-20059-5_1"},{"key":"10_CR11","first-page":"9564","volume":"35","author":"B Mustafa","year":"2022","unstructured":"Mustafa, B., Riquelme, C., Puigcerver, J., Jenatton, R., Houlsby, N.: Multimodal contrastive learning with LIMoE: the language-image mixture of experts. Adv. Neural. Inf. Process. Syst. 35, 9564\u20139576 (2022)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"10_CR12","doi-asserted-by":"crossref","unstructured":"Dai, D., et al.: DeepSeekMoe: Towards Ultimate Expert Specialization in Mixture-of-Experts Language Models. arXiv preprint arXiv:2401.06066 (2024)","DOI":"10.18653\/v1\/2024.acl-long.70"},{"key":"10_CR13","doi-asserted-by":"crossref","unstructured":"Huang, Q., et al.: Harder Tasks Need More Experts: Dynamic Routing in MoE Models. arXiv preprint arXiv:2403.07652 (2024)","DOI":"10.18653\/v1\/2024.acl-long.696"},{"key":"10_CR14","doi-asserted-by":"crossref","unstructured":"Yang, Y., Qi, S., Gu, W., Wang, C., Gao, C., Xu, Z.: XMoE: Sparse Models with Fine-grained and Adaptive Expert Selection. arXiv preprint arXiv:2403.18926 (2024)","DOI":"10.18653\/v1\/2024.findings-acl.694"},{"key":"10_CR15","unstructured":"Yue, T., Guo, L., Cheng, J., Gao, X., Huang, H., Liu, J.: Ada-K routing: boosting the efficiency of Moe-based LLMs. In: The Thirteenth International Conference on Learning Representations (2024)"},{"key":"10_CR16","unstructured":"Du, N., et al.: GLaM: efficient Scaling of Language Models with Mixture-of-Experts. In: International Conference on Machine Learning, pp. 5547\u20135569. PMLR (2022)"},{"key":"10_CR17","doi-asserted-by":"crossref","unstructured":"Ronneberger, O., Fischer, P., Brox, T.: U-Net: convolutional networks for biomedical image segmentation. In: Medical Image Computing and Computer-Assisted Intervention\u2013MICCAI 2015: 18th International Conference, Munich, Germany, October 5\u20139, 2015, proceedings, part III 18, pp. 234\u2013241. Springer (2015)","DOI":"10.1007\/978-3-319-24574-4_28"},{"key":"10_CR18","unstructured":"Jia, C., et al.: Scaling up visual and vision-language representation learning with noisy text supervision. In: International Conference on Machine Learning, pp. 4904\u20134916. PMLR (2021)"},{"key":"10_CR19","doi-asserted-by":"crossref","unstructured":"Li, Q., et al.: Anatomical structure-guided medical vision-language pre-training. In: International Conference on Medical Image Computing and Computer-Assisted Intervention, pp. 80\u201390. Springer (2024)","DOI":"10.1007\/978-3-031-72120-5_8"}],"container-title":["Lecture Notes in Computer Science","Advanced Intelligent Computing Technology and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-981-95-0027-7_10","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,7]],"date-time":"2025-09-07T12:39:22Z","timestamp":1757248762000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-981-95-0027-7_10"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"ISBN":["9789819500260","9789819500277"],"references-count":19,"URL":"https:\/\/doi.org\/10.1007\/978-981-95-0027-7_10","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"17 July 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ICIC","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Intelligent Computing","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Ningbo","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"China","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2025","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"26 July 2025","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 July 2025","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"21","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"icic2025","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/www.ic-icc.cn\/icg\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}