{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,21]],"date-time":"2025-06-21T14:40:09Z","timestamp":1750516809536,"version":"3.41.0"},"publisher-location":"Cham","reference-count":14,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031958403","type":"print"},{"value":"9783031958410","type":"electronic"}],"license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-95841-0_64","type":"book-chapter","created":{"date-parts":[[2025,6,21]],"date-time":"2025-06-21T14:13:40Z","timestamp":1750515220000},"page":"345-350","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Automated Phenotype-Based Clustering of\u00a0Clinical Reports Using Large Language Models"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-7250-8987","authenticated-orcid":false,"given":"Martina","family":"Saletta","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4244-9319","authenticated-orcid":false,"given":"Andrea","family":"Bombarda","sequence":"additional","affiliation":[]},{"given":"Matteo","family":"Bellini","sequence":"additional","affiliation":[]},{"given":"Lucrezia","family":"Goisis","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7780-0434","authenticated-orcid":false,"given":"Paolo","family":"Cazzaniga","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4707-212X","authenticated-orcid":false,"given":"Maria","family":"Iascone","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8391-8049","authenticated-orcid":false,"given":"Domenico Fabio","family":"Savo","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,6,22]]},"reference":[{"key":"64_CR1","doi-asserted-by":"crossref","unstructured":"TF\u2013IDF. Encyclopedia of Machine Learning, pp. 986\u2013987. Springer US, Boston, MA (2010)","DOI":"10.1007\/978-0-387-30164-8_832"},{"key":"64_CR2","doi-asserted-by":"crossref","unstructured":"Baddour, M., Paquelet, S., Rollier, P., De\u00a0Tayrac, M., Dameron, O., Labb\u00e9, T.: Phenotypes extraction from text: analysis and perspective in the llm era. In: 2024 IEEE 12th International Conference on Intelligent Systems (IS), pp.\u00a01\u20138. IEEE (2024)","DOI":"10.1109\/IS61756.2024.10705235"},{"key":"64_CR3","doi-asserted-by":"crossref","unstructured":"Bhattarai, K., et al.: Leveraging GPT-4 for identifying cancer phenotypes in electronic health records: a performance comparison between GPT-4, GPT-3.5-turbo, flan-t5, llama-3-8b, and spacy\u2019s rule-based and machine learning-based methods. JAMIA Open 7(3), ooae060 (2024)","DOI":"10.1093\/jamiaopen\/ooae060"},{"key":"64_CR4","doi-asserted-by":"publisher","first-page":"185","DOI":"10.1016\/j.patrec.2020.07.028","volume":"138","author":"MM Fard","year":"2020","unstructured":"Fard, M.M., Thonet, T., Gaussier, \u00c9.: Deep k-means: Jointly clustering with k-means and learning representations. Pattern Recognit. Lett. 138, 185\u2013192 (2020)","journal-title":"Pattern Recognit. Lett."},{"issue":"D1","key":"64_CR5","doi-asserted-by":"publisher","first-page":"D1333","DOI":"10.1093\/nar\/gkad1005","volume":"52","author":"MA Gargano","year":"2023","unstructured":"Gargano, M.A., Matentzoglu, N., Coleman, B., et al.: The human phenotype ontology in 2024: phenotypes around the world. Nucleic Acids Res. 52(D1), D1333\u2013D1346 (2023)","journal-title":"Nucleic Acids Res."},{"key":"64_CR6","unstructured":"MacQueen, J.: Some methods for classification and analysis of multivariate observations. In: Proceedings of 5-th Berkeley Symposium on Mathematical Statistics and Probability\/University of California Press (1967)"},{"issue":"1","key":"64_CR7","doi-asserted-by":"publisher","first-page":"86","DOI":"10.1002\/widm.53","volume":"2","author":"F Murtagh","year":"2012","unstructured":"Murtagh, F., Contreras, P.: Algorithms for hierarchical clustering: an overview. WIREs Data Mining Knowl. Discov. 2(1), 86\u201397 (2012)","journal-title":"WIREs Data Mining Knowl. Discov."},{"issue":"1","key":"64_CR8","doi-asserted-by":"publisher","DOI":"10.1016\/j.patter.2024.101118","volume":"6","author":"L Qin","year":"2025","unstructured":"Qin, L., et al.: A survey of multilingual large language models. Patterns 6(1), 101118 (2025)","journal-title":"Patterns"},{"key":"64_CR9","doi-asserted-by":"crossref","unstructured":"Roumeliotis, K.I., Tselikas, N.D., Nasiopoulos, D.K.: Llama 2: Early adopters\u2019 utilization of meta\u2019s new open-source pretrained model (2023)","DOI":"10.20944\/preprints202307.2142.v2"},{"key":"64_CR10","doi-asserted-by":"publisher","first-page":"53","DOI":"10.1016\/0377-0427(87)90125-7","volume":"20","author":"PJ Rousseeuw","year":"1987","unstructured":"Rousseeuw, P.J.: Silhouettes: a graphical aid to the interpretation and validation of cluster analysis. J. Comput. Appl. Math. 20, 53\u201365 (1987)","journal-title":"J. Comput. Appl. Math."},{"key":"64_CR11","unstructured":"Saletta, M.: https:\/\/github.com\/Martisal\/phenoClustering (2025)"},{"key":"64_CR12","unstructured":"Song, K., Tan, X., Qin, T., Lu, J., Liu, T.: MPNet: Masked and permuted pre-training for language understanding. In: Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, NeurIPS (2020)"},{"issue":"11","key":"64_CR13","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/0895-7177(93)90202-A","volume":"18","author":"MS Yang","year":"1993","unstructured":"Yang, M.S.: A survey of fuzzy clustering. Math. Comput. Model. 18(11), 1\u201316 (1993)","journal-title":"Math. Comput. Model."},{"key":"64_CR14","doi-asserted-by":"crossref","unstructured":"Zhang, Z., Zhao, J., Zhang, Q., Gui, T., Huang, X.: Unveiling linguistic regions in large language models. In: Proc. of the 62nd Annual Meeting of the Association for Computational Linguistics, ACL, pp. 6228\u20136247. Association for Computational Linguistics (2024)","DOI":"10.18653\/v1\/2024.acl-long.338"}],"container-title":["Lecture Notes in Computer Science","Artificial Intelligence in Medicine"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-95841-0_64","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,21]],"date-time":"2025-06-21T14:13:43Z","timestamp":1750515223000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-95841-0_64"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"ISBN":["9783031958403","9783031958410"],"references-count":14,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-95841-0_64","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"22 June 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"AIME","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Artificial Intelligence in Medicine","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Pavia","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2025","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"24 June 2025","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"27 June 2025","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"23","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"aime2025","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/aime25.aimedicine.info\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}