{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,10]],"date-time":"2026-06-10T05:29:59Z","timestamp":1781069399180,"version":"3.54.1"},"reference-count":36,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,1,28]],"date-time":"2025-01-28T00:00:00Z","timestamp":1738022400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2025,1,28]],"date-time":"2025-01-28T00:00:00Z","timestamp":1738022400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"funder":[{"DOI":"10.13039\/501100003784","name":"Great Ormond Street Hospital for Children","doi-asserted-by":"publisher","award":["21PP30"],"award-info":[{"award-number":["21PP30"]}],"id":[{"id":"10.13039\/501100003784","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100003784","name":"Great Ormond Street Hospital for Children","doi-asserted-by":"publisher","award":["21PP30"],"award-info":[{"award-number":["21PP30"]}],"id":[{"id":"10.13039\/501100003784","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100003784","name":"Great Ormond Street Hospital for Children","doi-asserted-by":"publisher","award":["21PP30"],"award-info":[{"award-number":["21PP30"]}],"id":[{"id":"10.13039\/501100003784","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["BMC Med Inform Decis Mak"],"DOI":"10.1186\/s12911-024-02812-9","type":"journal-article","created":{"date-parts":[[2025,1,28]],"date-time":"2025-01-28T16:03:47Z","timestamp":1738080227000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Discovering patient groups in sequential electronic healthcare data using unsupervised representation learning"],"prefix":"10.1186","volume":"25","author":[{"given":"Jingteng","family":"Li","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Kimberley R.","family":"Zakka","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"John","family":"Booth","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Louise","family":"Rigny","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Samiran","family":"Ray","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Mario","family":"Cortina-Borja","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Payam","family":"Barnaghi","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Neil","family":"Sebire","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2025,1,28]]},"reference":[{"key":"2812_CR1","unstructured":"Ehrenstein V, Kharrazi H, Lehmann H, et\u00a0al. Obtaining Data From Electronic Health Records. In: Gliklich R, Leavy M, Dreyer N, editors. Tools and Technologies for Registry Interoperability, Registries for Evaluating Patient Outcomes: A User\u2019s Guide, 3rd Edition. Rockville: Agency for Healthcare Research and Quality (US); 2019. pp. 10\u201313."},{"issue":"2","key":"2812_CR2","doi-asserted-by":"publisher","first-page":"43","DOI":"10.1145\/3219819.3219904","volume":"169","author":"T Bai","year":"2018","unstructured":"Bai T, Egleston BL, Zhang S, et al. Interpretable Representation Learning for Healthcare via Capturing Disease Progression through Time. KDD. 2018;169(2):43\u201351. https:\/\/doi.org\/10.1145\/3219819.3219904.","journal-title":"KDD."},{"key":"2812_CR3","doi-asserted-by":"publisher","unstructured":"Glover WJ, Li Z, Pachamanova D. The AI-Enhanced Future of Health Care Administrative Task Management. Catal Non-Issue content. 2022;3(2). https:\/\/doi.org\/10.1056\/CAT.21.0355.","DOI":"10.1056\/CAT.21.0355"},{"key":"2812_CR4","doi-asserted-by":"publisher","first-page":"87","DOI":"10.1016\/j.jbi.2018.06.001","volume":"83","author":"E Parimbelli","year":"2018","unstructured":"Parimbelli E, Marini S, Sacchi L, Bellazzi R. Patient similarity for precision medicine: A systematic review. J Biomed Inform. 2018;83:87\u201396. https:\/\/doi.org\/10.1016\/j.jbi.2018.06.001.","journal-title":"J Biomed Inform."},{"issue":"1","key":"2812_CR5","doi-asserted-by":"publisher","first-page":"e7","DOI":"10.2196\/medinform.6730","volume":"5","author":"A Sharafoddini","year":"2017","unstructured":"Sharafoddini A, Dubin JA, Lee J. Patient Similarity in Prediction Models Based on Health Data: A Scoping Review. JMIR Med Inform. 2017;5(1):e7. https:\/\/doi.org\/10.2196\/medinform.6730.","journal-title":"JMIR Med Inform."},{"issue":"9","key":"2812_CR6","doi-asserted-by":"publisher","first-page":"825","DOI":"10.1056\/NEJMsa1102519","volume":"365","author":"RD Cebul","year":"2011","unstructured":"Cebul RD, Love TE, Jain AK, Hebert CJ. Electronic Health Records and Quality of Diabetes Care. N Engl J Med. 2011;365(9):825\u201333. https:\/\/doi.org\/10.1056\/NEJMsa1102519.","journal-title":"N Engl J Med."},{"issue":"18","key":"2812_CR7","doi-asserted-by":"publisher","first-page":"1715","DOI":"10.1056\/NEJMsa1406552","volume":"371","author":"JM McWilliams","year":"2014","unstructured":"McWilliams JM, Landon BE, Chernew ME, Zaslavsky AM. Changes in Patients\u2019 Experiences in Medicare Accountable Care Organizations. N Engl J Med. 2014;371(18):1715\u201324. https:\/\/doi.org\/10.1056\/NEJMsa1406552.","journal-title":"N Engl J Med."},{"issue":"1\u201302","key":"2812_CR8","first-page":"32","volume":"60","author":"JH Holmes","year":"2021","unstructured":"Holmes JH, Beinlich J, Boland MR, Bowles KH, Chen Y, Cook TS, et al. Why Is the Electronic Health Record So Challenging for Research and Clinical Care? Methods Inf Med. 2021;60(1\u201302):32\u201348.","journal-title":"Methods Inf Med."},{"key":"2812_CR9","doi-asserted-by":"publisher","unstructured":"Berisha V, Krantsevich C, Hahn P, Hahn S, Dasarathy G, Turaga P, et\u00a0al. Digital medicine and the curse of dimensionality. npj Digit Med. 2021;4. https:\/\/doi.org\/10.1038\/s41746-021-00521-5.","DOI":"10.1038\/s41746-021-00521-5"},{"key":"2812_CR10","doi-asserted-by":"publisher","unstructured":"Sauer C, Chen L, Hyland S, et\u00a0al. Leveraging electronic health records for data science: common pitfalls and how to avoid them. Lancet Digit Health The. 2022;4(12). https:\/\/doi.org\/10.1016\/S2589-7500(22)00154-6.","DOI":"10.1016\/S2589-7500(22)00154-6"},{"issue":"10","key":"2812_CR11","doi-asserted-by":"publisher","first-page":"1419","DOI":"10.1093\/jamia\/ocy068","volume":"25","author":"C Xiao","year":"2018","unstructured":"Xiao C, Choi E, Sun J. Opportunities and challenges in developing deep learning models using electronic health records data: a systematic review. J Am Med Inform Assoc. 2018;25(10):1419\u201328. https:\/\/doi.org\/10.1093\/jamia\/ocy068.","journal-title":"J Am Med Inform Assoc."},{"issue":"2","key":"2812_CR12","doi-asserted-by":"publisher","first-page":"94","DOI":"10.7861\/futurehosp.6-2-94","volume":"6","author":"T Davenport","year":"2019","unstructured":"Davenport T, Kalakota R. The potential for artificial intelligence in healthcare. Future Healthc J. 2019;6(2):94\u20138.","journal-title":"Future Healthc J."},{"key":"2812_CR13","doi-asserted-by":"publisher","first-page":"4","DOI":"10.1016\/j.tacc.2021.02.007","volume":"38","author":"S Locke","year":"2021","unstructured":"Locke S, Bashall A, Al-Adely S, Moore J, Wilson A, Kitchen GB. Natural language processing in medicine: A review. Trends Anaesthesia Crit Care. 2021;38:4\u20139. https:\/\/doi.org\/10.1016\/j.tacc.2021.02.007.","journal-title":"Trends Anaesthesia Crit Care."},{"key":"2812_CR14","unstructured":"Le Q, Mikolov T. Distributed representations of sentences and documents. In: Proceedings of the 31st International Conference on International Conference on Machine Learning - Volume 32. Beijing: JMLR.org; 2014. p II-1188-II\u20131196."},{"key":"2812_CR15","doi-asserted-by":"publisher","unstructured":"Feng Y, Min X, Chen N, Chen H, Xie X, Wang H, et\u00a0al. Patient outcome prediction via convolutional neural networks based on multi-granularity medical concept embedding. In: 2017 IEEE International Conference on Bioinformatics and Biomedicine (BIBM). 2017. pp. 770\u20137. https:\/\/doi.org\/10.1109\/BIBM.2017.8217753.","DOI":"10.1109\/BIBM.2017.8217753"},{"issue":"2","key":"2812_CR16","doi-asserted-by":"publisher","first-page":"67","DOI":"10.1186\/s12911-017-0468-7","volume":"17","author":"Z Liu","year":"2017","unstructured":"Liu Z, Yang M, Wang X, Chen Q, Tang B, Wang Z, et al. Entity recognition from clinical texts via recurrent neural network. BMC Med Inform Decis Making. 2017;17(2):67. https:\/\/doi.org\/10.1186\/s12911-017-0468-7.","journal-title":"BMC Med Inform Decis Making."},{"key":"2812_CR17","doi-asserted-by":"crossref","unstructured":"Choi E, Bahadori MT, Searles E, Coffey C, Thompson M, Bost J, Tejedor-Sojo J, Sun J. Multi-layer Representation Learning for Medical Concepts. In: Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining. San Francisco: Association for Computing Machinery; 2016. p 1495\u2013504.","DOI":"10.1145\/2939672.2939823"},{"key":"2812_CR18","doi-asserted-by":"publisher","unstructured":"Zhu Z, Yin C, Qian B, Cheng Y, Wei J, Wang F. Measuring Patient Similarities via a Deep Architecture with Medical Concept Embedding. In: 2016 IEEE 16th International Conference on Data Mining (ICDM). 2016. pp. 749\u201358. https:\/\/doi.org\/10.1109\/ICDM.2016.0086.","DOI":"10.1109\/ICDM.2016.0086"},{"key":"2812_CR19","unstructured":"Choi E, Bahadori MT, Schuetz A, Stewart WF, Sun J. Doctor AI: Predicting Clinical Events via Recurrent Neural Networks. In: Doshi-Velez F, Fackler J, Kale D, Wallace B, Wiens J, editors. Proceedings of the 1st Machine Learning for Healthcare Conference. vol.\u00a056 of Proceedings of Machine Learning Research. Northeastern University. Boston: PMLR; 2016. pp. 301\u201318. https:\/\/proceedings.mlr.press\/v56\/Choi16.html."},{"key":"2812_CR20","unstructured":"Great Ormond Street Hospital for Children - Who We Are. https:\/\/www.gosh.nhs.uk\/about-us\/who-we-are\/. Accessed 30 Mar 2023."},{"key":"2812_CR21","doi-asserted-by":"publisher","unstructured":"Caroprese L, Veltri P, Vocaturo E, Zumpano E. Deep Learning Techniques for Electronic Health Record Analysis. 2018. pp. 1\u20134. https:\/\/doi.org\/10.1109\/IISA.2018.8633647.","DOI":"10.1109\/IISA.2018.8633647"},{"key":"2812_CR22","doi-asserted-by":"publisher","unstructured":"Li Y, Rao S, Solares J, et\u00a0al. BEHRT: Transformer for Electronic Health Records. Sci Rep. 2020;10(1). https:\/\/doi.org\/10.1038\/s41598-020-62922-y.","DOI":"10.1038\/s41598-020-62922-y"},{"key":"2812_CR23","doi-asserted-by":"publisher","unstructured":"Rasmy L, Xiang Y, Xie Z, et\u00a0al. Med-BERT: pretrained contextualized embeddings on large-scale structured electronic health records for disease prediction. npj Digit Med. 2021;4(86). https:\/\/doi.org\/10.1038\/s41746-021-00455-y.","DOI":"10.1038\/s41746-021-00455-y"},{"key":"2812_CR24","unstructured":"Devlin J, Chang M-W, Lee K, Toutanova K. BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding. In: Burstein J, Doran C, Solorio T (eds) Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, NAACL-HLT 2019 Vol 1 (Long and Short Papers). Minneapolis: Association for Computational Linguistics; 2019. p 4171\u201386."},{"key":"2812_CR25","unstructured":"Mikolov T, Chen K, Corrado G, Dean J. Efficient Estimation of Word Representations in Vector Space. In: Bengio Y, LeCun Y (eds) 1st International Conference on Learning Representations, ICLR 2013. Scottsdale: Workshop Track Proceedings; 2013."},{"key":"2812_CR26","doi-asserted-by":"publisher","unstructured":"Davis J, Goadrich M. The Relationship between Precision-Recall and ROC Curves. In: Proceedings of the 23rd International Conference on Machine Learning. ICML \u201906. New York: Association for Computing Machinery; 2006. pp. 233\u201340. https:\/\/doi.org\/10.1145\/1143844.1143874.","DOI":"10.1145\/1143844.1143874"},{"issue":"3","key":"2812_CR27","doi-asserted-by":"publisher","first-page":"235","DOI":"10.1561\/2200000008","volume":"2","author":"U Von Luxburg","year":"2010","unstructured":"Von Luxburg U. Clustering Stability: An Overview. Found Trends Mach Learn. 2010;2(3):235\u201374. https:\/\/doi.org\/10.1561\/2200000008.","journal-title":"Found Trends Mach Learn."},{"key":"2812_CR28","doi-asserted-by":"publisher","first-page":"53","DOI":"10.1016\/0377-0427(87)90125-7","volume":"20","author":"PJ Rousseeuw","year":"1987","unstructured":"Rousseeuw PJ. Silhouettes: A graphical aid to the interpretation and validation of cluster analysis. J Comput Appl Math. 1987;20:53\u201365. https:\/\/doi.org\/10.1016\/0377-0427(87)90125-7.","journal-title":"J Comput Appl Math."},{"key":"2812_CR29","doi-asserted-by":"publisher","unstructured":"Fukunaga K, Olsen DR. An Algorithm for Finding Intrinsic Dimensionality of Data. IEEE Trans Comput. 1971;C-20(2):176\u2013183. https:\/\/doi.org\/10.1109\/T-C.1971.223208.","DOI":"10.1109\/T-C.1971.223208"},{"issue":"1","key":"2812_CR30","doi-asserted-by":"publisher","first-page":"2","DOI":"10.1186\/1745-6150-2-2","volume":"2","author":"R Cangelosi","year":"2007","unstructured":"Cangelosi R, Goriely A. Component retention in principal component analysis with application to cDNA microarray data. Biol Direct. 2007;2(1):2. https:\/\/doi.org\/10.1186\/1745-6150-2-2.","journal-title":"Biol Direct."},{"key":"2812_CR31","doi-asserted-by":"publisher","unstructured":"Williams K, Thomson D, Seto I, Contopoulos-Ioannidis DG, Ioannidis JPA, Curtis S, et\u00a0al. Standard 6: Age Groups for Pediatric Trials. Pediatrics. 2012;129(Supplement_3):S153\u2013S160. https:\/\/doi.org\/10.1542\/peds.2012-0055I.","DOI":"10.1542\/peds.2012-0055I"},{"issue":"3","key":"2812_CR32","doi-asserted-by":"publisher","first-page":"e0118432","DOI":"10.1371\/journal.pone.0118432","volume":"10","author":"T Saito","year":"2015","unstructured":"Saito T, Rehmsmeier M. The precision-recall plot is more informative than the ROC plot when evaluating binary classifiers on imbalanced datasets. PLoS One. 2015;10(3):e0118432.","journal-title":"PLoS One."},{"key":"2812_CR33","doi-asserted-by":"publisher","unstructured":"Jiffry M, Khan A, Pires F, Okam N, Vargas J, Moin K, et\u00a0al. Agranulocytosis Secondary to Cancer Chemotherapy Associated With Higher In-Hospital Mortality in Patients With Central Line Insertion During a Hospital Stay. Cureus. 2023;15. https:\/\/doi.org\/10.7759\/cureus.34717.","DOI":"10.7759\/cureus.34717"},{"issue":"1","key":"2812_CR34","doi-asserted-by":"publisher","first-page":"105","DOI":"10.1016\/j.amjcard.2014.03.063","volume":"114","author":"C Nyboe","year":"2014","unstructured":"Nyboe C, Olsen MS, Nielsen-Kudsk JE, Johnsen SP, Hjortdal VE. Risk of Pneumonia in Adults With Closed Versus Unclosed Atrial Septal Defect (from a Nationwide Cohort Study). Am J Cardiol. 2014;114(1):105\u201310. https:\/\/doi.org\/10.1016\/j.amjcard.2014.03.063.","journal-title":"Am J Cardiol."},{"key":"2812_CR35","unstructured":"Vaswani A, Shazeer N, Parmar N, Uszkoreit J, Jones L, Gomez AN, Kaiser \u0141, Polosukhin I. Attention is all you need. In: Proceedings of the 31st International Conference on Neural Information Processing Systems. Long Beach: Curran Associates Inc.; 2017. p 6000\u20136010"},{"issue":"1","key":"2812_CR36","doi-asserted-by":"publisher","first-page":"160035","DOI":"10.1038\/sdata.2016.35","volume":"3","author":"AEW Johnson","year":"2016","unstructured":"Johnson AEW, Pollard TJ, Shen L, Lehman LWH, Feng M, Ghassemi M, et al. MIMIC-III, a freely accessible critical care database. Sci Data. 2016;3(1):160035. https:\/\/doi.org\/10.1038\/sdata.2016.35.","journal-title":"Sci Data."}],"container-title":["BMC Medical Informatics and Decision Making"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s12911-024-02812-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1186\/s12911-024-02812-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s12911-024-02812-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,28]],"date-time":"2025-01-28T16:03:53Z","timestamp":1738080233000},"score":1,"resource":{"primary":{"URL":"https:\/\/bmcmedinformdecismak.biomedcentral.com\/articles\/10.1186\/s12911-024-02812-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,1,28]]},"references-count":36,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2025,12]]}},"alternative-id":["2812"],"URL":"https:\/\/doi.org\/10.1186\/s12911-024-02812-9","relation":{},"ISSN":["1472-6947"],"issn-type":[{"value":"1472-6947","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,1,28]]},"assertion":[{"value":"10 July 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"8 December 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"28 January 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The use of de-identified, routinely collected electronic healthcare data was approved by the London-South East Research Ethics Committee under REC approval [21\/LO\/0646]: Use of routine healthcare and operational hospital data for research. The research data obtained from GOSH DRE was de-identified in which patient-identifiable information has been redacted. In accordance with the UK Policy Framework for Health and Social Care Research, the requirement for informed consent in this study were waived following approval from GOSH.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval and consent to participate"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}},{"value":"The Authors declare no competing financial or non-financial interests.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"45"}}