{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,24]],"date-time":"2026-03-24T06:29:14Z","timestamp":1774333754739,"version":"3.50.1"},"publisher-location":"Cham","reference-count":26,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783032049773","type":"print"},{"value":"9783032049780","type":"electronic"}],"license":[{"start":{"date-parts":[[2025,9,19]],"date-time":"2025-09-19T00:00:00Z","timestamp":1758240000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,9,19]],"date-time":"2025-09-19T00:00:00Z","timestamp":1758240000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2026]]},"DOI":"10.1007\/978-3-032-04978-0_53","type":"book-chapter","created":{"date-parts":[[2025,9,18]],"date-time":"2025-09-18T16:16:22Z","timestamp":1758212182000},"page":"554-564","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Revisiting Automatic Data Curation for\u00a0Vision Foundation Models in\u00a0Digital Pathology"],"prefix":"10.1007","author":[{"given":"Boqi","family":"Chen","sequence":"first","affiliation":[]},{"given":"C\u00e9dric","family":"Vincent-Cuaz","sequence":"additional","affiliation":[]},{"given":"Lydia A.","family":"Schoenpflug","sequence":"additional","affiliation":[]},{"given":"Manuel","family":"Madeira","sequence":"additional","affiliation":[]},{"given":"Lisa","family":"Fournier","sequence":"additional","affiliation":[]},{"given":"Vaishnavi","family":"Subramanian","sequence":"additional","affiliation":[]},{"given":"Sonali","family":"Andani","sequence":"additional","affiliation":[]},{"given":"Samuel","family":"Ruiperez-Campillo","sequence":"additional","affiliation":[]},{"given":"Julia E.","family":"Vogt","sequence":"additional","affiliation":[]},{"given":"Rapha\u00eblle","family":"Luisier","sequence":"additional","affiliation":[]},{"given":"Dorina","family":"Thanou","sequence":"additional","affiliation":[]},{"given":"Viktor H.","family":"Koelzer","sequence":"additional","affiliation":[]},{"given":"Pascal","family":"Frossard","sequence":"additional","affiliation":[]},{"given":"Gabriele","family":"Campanella","sequence":"additional","affiliation":[]},{"given":"Gunnar","family":"R\u00e4tsch","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,9,19]]},"reference":[{"key":"53_CR1","doi-asserted-by":"publisher","first-page":"122","DOI":"10.1016\/j.media.2019.05.010","volume":"56","author":"G Aresta","year":"2019","unstructured":"Aresta, G., et al.: Bach: grand challenge on breast cancer histology images. Med. Image Anal. 56, 122\u2013139 (2019)","journal-title":"Med. Image Anal."},{"key":"53_CR2","doi-asserted-by":"crossref","unstructured":"Barbano, C.A., et al.: Unitopatho, a labeled histopathological dataset for colorectal polyps classification and adenoma dysplasia grading. In: 2021 IEEE International Conference on Image Processing (ICIP), pp. 76\u201380. IEEE (2021)","DOI":"10.1109\/ICIP42928.2021.9506198"},{"key":"53_CR3","doi-asserted-by":"crossref","unstructured":"Brancati, N., et\u00a0al.: Bracs: a dataset for breast carcinoma subtyping in h &e histology images. Database 2022, baac093 (2022)","DOI":"10.1093\/database\/baac093"},{"key":"53_CR4","doi-asserted-by":"crossref","unstructured":"Campanella, G., et al.: Clinical-grade computational pathology using weakly supervised deep learning on whole slide images. Nat. Med. 25(8), 1301\u20131309 (2019)","DOI":"10.1038\/s41591-019-0508-1"},{"key":"53_CR5","doi-asserted-by":"crossref","unstructured":"Caron, M., et al.: Emerging properties in self-supervised vision transformers. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 9650\u20139660 (2021)","DOI":"10.1109\/ICCV48922.2021.00951"},{"issue":"3","key":"53_CR6","doi-asserted-by":"publisher","first-page":"850","DOI":"10.1038\/s41591-024-02857-3","volume":"30","author":"RJ Chen","year":"2024","unstructured":"Chen, R.J., et al.: Towards a general-purpose foundation model for computational pathology. Nat. Med. 30(3), 850\u2013862 (2024)","journal-title":"Nat. Med."},{"key":"53_CR7","unstructured":"Chen, S., et\u00a0al.: Benchmarking embedding aggregation methods in computational pathology: a clinical data perspective. arXiv preprint arXiv:2407.07841 (2024)"},{"key":"53_CR8","unstructured":"Dippel, J., et\u00a0al.: Rudolfv: a foundation model by pathologists for pathologists. arXiv preprint arXiv:2401.04079 (2024)"},{"key":"53_CR9","unstructured":"Dosovitskiy, A.: An image is worth $$16 \\times 16$$ words: transformers for image recognition at scale. arXiv preprint arXiv:2010.11929 (2020)"},{"key":"53_CR10","unstructured":"Geifman, Y., El-Yaniv, R.: Deep active learning over the long tail. arXiv preprint arXiv:1711.00941 (2017)"},{"key":"53_CR11","unstructured":"Han, C., et\u00a0al.: Wsss4luad: grand challenge on weakly-supervised tissue semantic segmentation for lung adenocarcinoma. arXiv preprint arXiv:2204.06455 (2022)"},{"key":"53_CR12","doi-asserted-by":"crossref","unstructured":"He, K., Chen, X., Xie, S., Li, Y., Doll\u00e1r, P., Girshick, R.: Masked autoencoders are scalable vision learners. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 16000\u201316009 (2022)","DOI":"10.1109\/CVPR52688.2022.01553"},{"key":"53_CR13","doi-asserted-by":"publisher","DOI":"10.1016\/j.media.2024.103143","volume":"94","author":"F H\u00f6rst","year":"2024","unstructured":"H\u00f6rst, F., et al.: Cellvit: vision transformers for precise cell segmentation and classification. Med. Image Anal. 94, 103143 (2024)","journal-title":"Med. Image Anal."},{"key":"53_CR14","doi-asserted-by":"crossref","unstructured":"Hosseini, M.S., et al.: Atlas of digital pathology: a generalized hierarchical histological tissue type-annotated database for deep learning. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 11747\u201311756 (2019)","DOI":"10.1109\/CVPR.2019.01202"},{"key":"53_CR15","unstructured":"Ilse, M., Tomczak, J., Welling, M.: Attention-based deep multiple instance learning. In: International Conference on Machine Learning, pp. 2127\u20132136. PMLR (2018)"},{"issue":"1","key":"53_CR16","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pmed.1002730","volume":"16","author":"JN Kather","year":"2019","unstructured":"Kather, J.N., et al.: Predicting survival from colorectal cancer histology slides using deep learning: a retrospective multicenter study. PLoS Med. 16(1), e1002730 (2019)","journal-title":"PLoS Med."},{"key":"53_CR17","unstructured":"Oquab, M., et\u00a0al.: Dinov2: learning robust visual features without supervision. arXiv preprint arXiv:2304.07193 (2023)"},{"key":"53_CR18","first-page":"19523","volume":"35","author":"B Sorscher","year":"2022","unstructured":"Sorscher, B., Geirhos, R., Shekhar, S., Ganguli, S., Morcos, A.: Beyond neural scaling laws: beating power law scaling via data pruning. Adv. Neural Inf. Process. Syst. 35, 19523\u201319536 (2022)","journal-title":"Adv. Neural Inf. Process. Syst."},{"issue":"7","key":"53_CR19","doi-asserted-by":"publisher","first-page":"1455","DOI":"10.1109\/TBME.2015.2496264","volume":"63","author":"FA Spanhol","year":"2015","unstructured":"Spanhol, F.A., Oliveira, L.S., Petitjean, C., Heutte, L.: A dataset for breast cancer histopathological image classification. IEEE Trans. Biomed. Eng. 63(7), 1455\u20131462 (2015)","journal-title":"IEEE Trans. Biomed. Eng."},{"key":"53_CR20","unstructured":"Toneva, M., Sordoni, A., Combes, R.T.D., Trischler, A., Bengio, Y., Gordon, G.J.: An empirical study of example forgetting during deep neural network learning. arXiv preprint arXiv:1812.05159 (2018)"},{"key":"53_CR21","unstructured":"Vo, H.V., et\u00a0al.: Automatic data curation for self-supervised learning: a clustering-based approach. arXiv preprint arXiv:2405.15613 (2024)"},{"key":"53_CR22","doi-asserted-by":"publisher","unstructured":"Vo, H.V., Sim\u00e9oni, O., Gidaris, S., Bursuc, A., P\u00e9rez, P., Ponce, J.: Active learning strategies for weakly-supervised object detection. In: Avidan, S., Brostow, G., Ciss\u00e9, M., Farinella, G.M., Hassner, T. (eds.) Computer Vision \u2013 ECCV 2022. ECCV 2022. LNCS, vol. 13690, pp. 211\u2013230. Springer, Cham (2022). https:\/\/doi.org\/10.1007\/978-3-031-20056-4_13","DOI":"10.1007\/978-3-031-20056-4_13"},{"key":"53_CR23","unstructured":"Vorontsov, E., et\u00a0al.: Virchow: a million-slide digital pathology foundation model. arXiv preprint arXiv:2309.07778 (2023)"},{"key":"53_CR24","unstructured":"Xu, H., et\u00a0al.: A whole-slide foundation model for digital pathology from real-world data. Nature 1\u20138 (2024)"},{"issue":"1","key":"53_CR25","doi-asserted-by":"publisher","first-page":"6796","DOI":"10.1038\/s41467-023-42504-y","volume":"14","author":"S Zhao","year":"2023","unstructured":"Zhao, S., et al.: Single-cell morphological and topological atlas reveals the ecosystem diversity of human breast cancer. Nat. Commun. 14(1), 6796 (2023)","journal-title":"Nat. Commun."},{"issue":"4","key":"53_CR26","doi-asserted-by":"publisher","first-page":"881","DOI":"10.1109\/TMI.2021.3125459","volume":"41","author":"C Zhu","year":"2021","unstructured":"Zhu, C., Chen, W., Peng, T., Wang, Y., Jin, M.: Hard sample aware noise robust learning for histopathology image classification. IEEE Trans. Med. Imaging 41(4), 881\u2013894 (2021)","journal-title":"IEEE Trans. Med. Imaging"}],"container-title":["Lecture Notes in Computer Science","Medical Image Computing and Computer Assisted Intervention \u2013 MICCAI 2025"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-032-04978-0_53","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,18]],"date-time":"2025-09-18T22:07:30Z","timestamp":1758233250000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-032-04978-0_53"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,9,19]]},"ISBN":["9783032049773","9783032049780"],"references-count":26,"URL":"https:\/\/doi.org\/10.1007\/978-3-032-04978-0_53","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,9,19]]},"assertion":[{"value":"19 September 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"The authors have no competing interests to declare that are relevant to this article.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Disclosure of Interests"}},{"value":"MICCAI","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Medical Image Computing and Computer-Assisted Intervention","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Daejeon","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Korea (Republic of)","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2025","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"23 September 2025","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"27 September 2025","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"28","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"miccai2025","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/conferences.miccai.org\/2025\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}