{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,26]],"date-time":"2026-02-26T15:58:29Z","timestamp":1772121509195,"version":"3.50.1"},"reference-count":49,"publisher":"Elsevier BV","issue":"7","license":[{"start":{"date-parts":[[2021,7,1]],"date-time":"2021-07-01T00:00:00Z","timestamp":1625097600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2021,7,1]],"date-time":"2021-07-01T00:00:00Z","timestamp":1625097600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2021,5,20]],"date-time":"2021-05-20T00:00:00Z","timestamp":1621468800000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0\/"}],"funder":[{"DOI":"10.13039\/100000002","name":"National Institutes of Health","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100000002","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000070","name":"National Institute of Biomedical Imaging and Bioengineering","doi-asserted-by":"publisher","award":["R56 EB020527"],"award-info":[{"award-number":["R56 EB020527"]}],"id":[{"id":"10.13039\/100000070","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["cell.com","elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Patterns"],"published-print":{"date-parts":[[2021,7]]},"DOI":"10.1016\/j.patter.2021.100289","type":"journal-article","created":{"date-parts":[[2021,6,17]],"date-time":"2021-06-17T10:30:13Z","timestamp":1623925813000},"page":"100289","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":23,"title":["Structuring clinical text with AI: Old versus new natural language processing techniques evaluated on eight common cardiovascular diseases"],"prefix":"10.1016","volume":"2","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-7058-2603","authenticated-orcid":false,"given":"Xianghao","family":"Zhan","sequence":"first","affiliation":[]},{"given":"Marie","family":"Humbert-Droz","sequence":"additional","affiliation":[]},{"given":"Pritam","family":"Mukherjee","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9965-5466","authenticated-orcid":false,"given":"Olivier","family":"Gevaert","sequence":"additional","affiliation":[]}],"member":"78","reference":[{"key":"10.1016\/j.patter.2021.100289_bib1","article-title":"Embedding electronic health records for clinical information retrieval","author":"Wei","year":"2018","journal-title":"arXiv"},{"key":"10.1016\/j.patter.2021.100289_bib2","doi-asserted-by":"crossref","first-page":"e12239","DOI":"10.2196\/12239","article-title":"Natural language processing of clinical notes on chronic diseases: systematic review","volume":"7","author":"Sheikhalishahi","year":"2019","journal-title":"JMIR Med. Inform."},{"key":"10.1016\/j.patter.2021.100289_bib3","series-title":"Machine Learning for Healthcare Conference","first-page":"301","article-title":"Doctor AI: predicting clinical events via recurrent neural networks","author":"Choi","year":"2016"},{"key":"10.1016\/j.patter.2021.100289_bib4","doi-asserted-by":"crossref","first-page":"34","DOI":"10.1016\/j.jbi.2017.11.011","article-title":"Clinical information extraction applications: a literature review","volume":"77","author":"Wang","year":"2018","journal-title":"J.\u00a0Biomed. Inform."},{"key":"10.1016\/j.patter.2021.100289_bib5","doi-asserted-by":"crossref","first-page":"26094","DOI":"10.1038\/srep26094","article-title":"Deep patient: an unsupervised representation to predict the future of patients from the electronic health records","volume":"6","author":"Miotto","year":"2016","journal-title":"Sci. Rep."},{"key":"10.1016\/j.patter.2021.100289_bib6","doi-asserted-by":"crossref","first-page":"395","DOI":"10.1038\/nrg3208","article-title":"Mining electronic health records: towards better research applications and clinical care","volume":"13","author":"Jensen","year":"2012","journal-title":"Nat. Rev. Genet."},{"key":"10.1016\/j.patter.2021.100289_bib7","doi-asserted-by":"crossref","first-page":"198","DOI":"10.1093\/jamia\/ocw042","article-title":"Opportunities and challenges in developing risk prediction models with electronic health records data: a systematic review","volume":"24","author":"Goldstein","year":"2017","journal-title":"J.\u00a0Am. Med. Inform. Assoc."},{"key":"10.1016\/j.patter.2021.100289_bib8","article-title":"Implicit negative feedback in clinical information retrieval","author":"Kuhn","year":"2016","journal-title":"arXiv"},{"key":"10.1016\/j.patter.2021.100289_bib9","article-title":"Explainable prediction of medical codes from clinical text","author":"Mullenbach","year":"2018","journal-title":"arXiv"},{"key":"10.1016\/j.patter.2021.100289_bib10","doi-asserted-by":"crossref","first-page":"891","DOI":"10.1097\/TA.0000000000002194","article-title":"A trauma mortality prediction model based on the ICD-10-CM lexicon: TMPM-ICD10","volume":"86","author":"Osler","year":"2019","journal-title":"J.\u00a0Trauma Acute Care Surg."},{"key":"10.1016\/j.patter.2021.100289_bib11","series-title":"ICD-10 International Statistical Classification of Diseases and Related Health Problems","year":"2008"},{"key":"10.1016\/j.patter.2021.100289_bib12","doi-asserted-by":"crossref","first-page":"460","DOI":"10.1001\/jamacardio.2019.0716","article-title":"Misclassification of myocardial injury as myocardial infarction: implications for assessing outcomes in value-based programs","volume":"4","author":"McCarthy","year":"2019","journal-title":"JAMA Cardiol."},{"key":"10.1016\/j.patter.2021.100289_bib13","doi-asserted-by":"crossref","first-page":"e003056","DOI":"10.1161\/JAHA.115.003056","article-title":"Accuracy of ICD-9-CM codes by hospital characteristics and stroke severity: Paul Coverdell national acute stroke program","volume":"5","author":"Chang","year":"2016","journal-title":"J.\u00a0Am. Heart Assoc."},{"key":"10.1016\/j.patter.2021.100289_bib14","doi-asserted-by":"crossref","first-page":"1602","DOI":"10.1161\/01.STR.29.8.1602","article-title":"Accuracy of ICD-9-CM coding for the identification of patients with acute ischemic stroke: effect of modifier codes","volume":"29","author":"Goldstein","year":"1998","journal-title":"Stroke"},{"key":"10.1016\/j.patter.2021.100289_bib15","first-page":"912","article-title":"Accuracy and completeness of clinical coding using ICD-10 for ambulatory visits","author":"Horsky","year":"2017"},{"key":"10.1016\/j.patter.2021.100289_bib16","first-page":"11","article-title":"A statistical interpretation of term specificity and its application in retrieval","volume":"28","author":"Jones","year":"1972","journal-title":"J.\u00a0Doc."},{"key":"10.1016\/j.patter.2021.100289_bib17","doi-asserted-by":"crossref","first-page":"85","DOI":"10.1186\/s13023-018-0830-6","article-title":"Next generation phenotyping using narrative reports in a rare disease clinical data warehouse","volume":"13","author":"Garcelon","year":"2018","journal-title":"Orphanet J. Rare Dis."},{"key":"10.1016\/j.patter.2021.100289_bib18","article-title":"Unsupervised learning of sentence embeddings using compositional n-gram features","author":"Pagliardini","year":"2017","journal-title":"arXiv"},{"key":"10.1016\/j.patter.2021.100289_bib19","article-title":"Towards universal paraphrastic sentence embeddings","author":"Wieting","year":"2015","journal-title":"arXiv"},{"key":"10.1016\/j.patter.2021.100289_bib20","series-title":"5th International Conference on Learning Representations","article-title":"A simple but tough-to-beat baseline for sentence embeddings","author":"Arora","year":"2017"},{"key":"10.1016\/j.patter.2021.100289_bib21","series-title":"Proceedings of the Conference and Labs of the Evaluation Forum CEUR Workshop","first-page":"1","article-title":"Transformers in semantic indexing of clinical codes","author":"Rishivardhan","year":"2020"},{"key":"10.1016\/j.patter.2021.100289_bib22","series-title":"Advances in Neural Information Processing Systems 17 (NIPS 2004)","first-page":"849","article-title":"Semi-supervised learning with penalized probabilistic clustering","author":"Lu","year":"2005"},{"key":"10.1016\/j.patter.2021.100289_bib23","series-title":"Proceedings of the IET Doctoral Forum on Biomedical Engineering, Healthcare, Robotics and Artificial Intelligence 2018 (BRAIN 2018)","article-title":"Online conformal prediction for classifying different types of herbal medicines with electronic noise","author":"Zhan","year":"2018"},{"key":"10.1016\/j.patter.2021.100289_bib24","doi-asserted-by":"crossref","first-page":"107588","DOI":"10.1016\/j.measurement.2020.107588","article-title":"An electronic nose-based assistive diagnostic prototype for lung cancer detection with conformal prediction","volume":"158","author":"Zhan","year":"2020","journal-title":"Measurement"},{"key":"10.1016\/j.patter.2021.100289_bib25","first-page":"149","article-title":"An information extraction framework for cohort identification using electronic health records","volume":"2013","author":"Liu","year":"2013","journal-title":"AMIA Jt Summits Transl. Sci. Proc."},{"key":"10.1016\/j.patter.2021.100289_bib26","doi-asserted-by":"crossref","first-page":"130","DOI":"10.1038\/s41746-019-0208-8","article-title":"Desiderata for delivering NLP to accelerate healthcare AI advancement and a Mayo Clinic NLP-as-a-service implementation","volume":"2","author":"Wen","year":"2019","journal-title":"NPJ Digit. Med."},{"key":"10.1016\/j.patter.2021.100289_bib27","doi-asserted-by":"crossref","first-page":"i446","DOI":"10.1093\/bioinformatics\/btz342","article-title":"Deep learning with multimodal representation for pancancer prognosis prediction","volume":"35","author":"Cheerla","year":"2019","journal-title":"Bioinformatics"},{"key":"10.1016\/j.patter.2021.100289_bib28","doi-asserted-by":"crossref","first-page":"70","DOI":"10.1016\/j.ebiom.2019.06.034","article-title":"Development and validation of radiomic signatures of head and neck squamous cell carcinoma molecular features and subtypes","volume":"45","author":"Huang","year":"2019","journal-title":"EBioMedicine"},{"key":"10.1016\/j.patter.2021.100289_bib29","doi-asserted-by":"crossref","first-page":"274","DOI":"10.1038\/s42256-020-0173-6","article-title":"A shallow convolutional neural network predicts prognosis of lung cancer patients in multi-institutional computed tomography image datasets","volume":"2","author":"Mukherjee","year":"2020","journal-title":"Nat. Mach. Intelligence"},{"key":"10.1016\/j.patter.2021.100289_bib30","doi-asserted-by":"crossref","first-page":"75","DOI":"10.1038\/s41746-021-00446-z","article-title":"AI-based analysis of CT images for rapid triage of COVID-19 patients","volume":"4","author":"Xu","year":"2021","journal-title":"NPJ Digital Med."},{"key":"10.1016\/j.patter.2021.100289_bib31","series-title":"Proceedings of the LREC 2010 Workshop on New Challenges for NLP Frameworks","first-page":"45","article-title":"Software framework for topic modelling with large corpora","author":"Rehurek","year":"2010"},{"key":"10.1016\/j.patter.2021.100289_bib32","doi-asserted-by":"crossref","first-page":"130","DOI":"10.1108\/eb046814","article-title":"An algorithm for suffix stripping","volume":"14","author":"Porter","year":"1980","journal-title":"Program"},{"key":"10.1016\/j.patter.2021.100289_bib33","series-title":"Natural Language Processing with Python: Analyzing Text with the Natural Language Toolkit","author":"Bird","year":"2009"},{"key":"10.1016\/j.patter.2021.100289_bib34","doi-asserted-by":"crossref","first-page":"146","DOI":"10.1080\/00437956.1954.11659520","article-title":"Distributional structure","volume":"10","author":"Harris","year":"1954","journal-title":"Word"},{"key":"10.1016\/j.patter.2021.100289_bib35","article-title":"Distributed representations of words and phrases and their compositionality","author":"Mikolov","year":"2013","journal-title":"arXiv"},{"key":"10.1016\/j.patter.2021.100289_bib36","doi-asserted-by":"crossref","first-page":"52","DOI":"10.1038\/s41597-019-0055-0","article-title":"BioWordVec, improving biomedical word embeddings with subword information and MeSH","volume":"6","author":"Zhang","year":"2019","journal-title":"Sci. Data"},{"key":"10.1016\/j.patter.2021.100289_bib37","series-title":"31st International Conference on Machine Learning","first-page":"1188","article-title":"Distributed representations of sentences and documents","volume":"32","author":"Le","year":"2014"},{"key":"10.1016\/j.patter.2021.100289_bib38","first-page":"2579","article-title":"Visualizing data using t-SNE","volume":"9","author":"Van der Maaten","year":"2008","journal-title":"J.\u00a0Machine Learn. Res."},{"key":"10.1016\/j.patter.2021.100289_bib39","series-title":"2016 IEEE-EMBS International Conference on Biomedical and Health Informatics (BHI)","first-page":"595","article-title":"Nonlinear dimension reduction for EEG-based epileptic seizure detection.","author":"Birjandtalab","year":"2016"},{"key":"10.1016\/j.patter.2021.100289_bib40","article-title":"Boost AI power: data augmentation strategies with unlabelled data and conformal prediction, a case in alternative herbal medicine discrimination with electronic nose","author":"Liu","year":"2021","journal-title":"arXiv"},{"key":"10.1016\/j.patter.2021.100289_bib41","doi-asserted-by":"crossref","first-page":"1750017","DOI":"10.1142\/S0219720017500172","article-title":"Application of t-SNE to human genetic data","volume":"15","author":"Li","year":"2017","journal-title":"J.\u00a0Bioinform. Comput. Biol."},{"key":"10.1016\/j.patter.2021.100289_bib42","doi-asserted-by":"crossref","first-page":"215","DOI":"10.1111\/j.2517-6161.1958.tb00292.x","article-title":"The regression analysis of binary sequences","volume":"20","author":"Cox","year":"1958","journal-title":"J.\u00a0R. Stat. Soc. Ser. B (Methodol.)"},{"key":"10.1016\/j.patter.2021.100289_bib43","first-page":"2825","article-title":"Scikit-learn: machine learning in Python","volume":"12","author":"Pedregosa","year":"2011","journal-title":"J.\u00a0Mach. Learn. Res."},{"key":"10.1016\/j.patter.2021.100289_bib44","series-title":"Proceedings of the 23rd International Conference on Machine Learning","first-page":"233","article-title":"The relationship between Precision-Recall and ROC curves","author":"Davis","year":"2006"},{"key":"10.1016\/j.patter.2021.100289_bib45","series-title":"Breakthroughs in Statistics","first-page":"569","article-title":"Bootstrap methods: another look at the jackknife","author":"Efron","year":"1992"},{"key":"10.1016\/j.patter.2021.100289_bib46","doi-asserted-by":"crossref","first-page":"160035","DOI":"10.1038\/sdata.2016.35","article-title":"MIMIC-III, a freely accessible critical care database","volume":"3","author":"Johnson","year":"2016","journal-title":"Sci. Data"},{"key":"10.1016\/j.patter.2021.100289_bib47","first-page":"844","article-title":"Reusable filtering functions for application in ICU data: a case study","author":"Major","year":"2016"},{"key":"10.1016\/j.patter.2021.100289_bib48","doi-asserted-by":"crossref","first-page":"141","DOI":"10.1016\/j.cmpb.2019.05.024","article-title":"An empirical evaluation of deep learning for ICD-9 code assignment using MIMIC-III clinical notes","volume":"177","author":"Huang","year":"2019","journal-title":"Comput. Methods Programs Biomed."},{"key":"10.1016\/j.patter.2021.100289_bib49","series-title":"The International Classification of Diseases: Ninth Revision (ICD-9)","author":"Slee","year":"1978"}],"container-title":["Patterns"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S2666389921001227?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S2666389921001227?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2025,11,12]],"date-time":"2025-11-12T23:44:38Z","timestamp":1762991078000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S2666389921001227"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,7]]},"references-count":49,"journal-issue":{"issue":"7","published-print":{"date-parts":[[2021,7]]}},"alternative-id":["S2666389921001227"],"URL":"https:\/\/doi.org\/10.1016\/j.patter.2021.100289","relation":{"has-preprint":[{"id-type":"doi","id":"10.1101\/2021.01.27.21250477","asserted-by":"object"}]},"ISSN":["2666-3899"],"issn-type":[{"value":"2666-3899","type":"print"}],"subject":[],"published":{"date-parts":[[2021,7]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"Structuring clinical text with AI: Old versus new natural language processing techniques evaluated on eight common cardiovascular diseases","name":"articletitle","label":"Article Title"},{"value":"Patterns","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.patter.2021.100289","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2021 The Authors.","name":"copyright","label":"Copyright"}],"article-number":"100289"}}