{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,4]],"date-time":"2026-05-04T11:22:18Z","timestamp":1777893738437,"version":"3.51.4"},"reference-count":50,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2019,4,8]],"date-time":"2019-04-08T00:00:00Z","timestamp":1554681600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"funder":[{"name":"NIH","award":["R21LM012618-01"],"award-info":[{"award-number":["R21LM012618-01"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Healthc Inform Res"],"published-print":{"date-parts":[[2019,9]]},"DOI":"10.1007\/s41666-019-00046-3","type":"journal-article","created":{"date-parts":[[2019,4,9]],"date-time":"2019-04-09T01:02:33Z","timestamp":1554771753000},"page":"283-299","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":38,"title":["Identifying Breast Cancer Distant Recurrences from Electronic Health Records Using Machine Learning"],"prefix":"10.1007","volume":"3","author":[{"given":"Zexian","family":"Zeng","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Liang","family":"Yao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ankita","family":"Roy","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xiaoyu","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sasa","family":"Espino","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Susan E","family":"Clare","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Seema A","family":"Khan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0195-7456","authenticated-orcid":false,"given":"Yuan","family":"Luo","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2019,4,8]]},"reference":[{"issue":"15","key":"46_CR1","doi-asserted-by":"publisher","first-page":"1726","DOI":"10.1001\/jama.2010.1525","volume":"304","author":"JR Egner","year":"2010","unstructured":"Egner JR (2010) AJCC cancer staging manual. JAMA 304(15):1726\u20131727","journal-title":"JAMA"},{"issue":"11","key":"46_CR2","doi-asserted-by":"publisher","first-page":"2813","DOI":"10.1002\/cncr.10572","volume":"94","author":"MG L\u00ea","year":"2002","unstructured":"L\u00ea MG, Arriagada R, Spielmann M, Guinebreti\u00e8re JM, Rochard F (2002) Prognostic factors for death after an isolated local recurrence in patients with early-stage breast carcinoma. Cancer 94(11):2813\u20132820","journal-title":"Cancer"},{"issue":"5","key":"46_CR3","doi-asserted-by":"publisher","first-page":"966","DOI":"10.1002\/cncr.22472","volume":"109","author":"AM Geiger","year":"2007","unstructured":"Geiger AM, Thwin SS, Lash TL, Buist DSM, Prout MN, Wei F, Field TS, Ulcickas Yood M, Frost FJ, Enger SM, Silliman RA (2007) Recurrences and second primary breast cancers in older women with initial early-stage disease. Cancer 109(5):966\u2013974","journal-title":"Cancer"},{"issue":"6","key":"46_CR4","doi-asserted-by":"publisher","first-page":"R85","DOI":"10.1186\/bcr2453","volume":"11","author":"LA Habel","year":"2009","unstructured":"Habel LA, Achacoso NS, Haque R, Nekhlyudov L, Fletcher SW, Schnitt SJ, Collins LC, Geiger AM, Puligandla B, Acton L, Quesenberry CP (2009) Declining recurrence among ductal carcinoma in situ patients treated with breast-conserving surgery in the community setting. Breast Cancer Res 11(6):R85","journal-title":"Breast Cancer Res"},{"issue":"4","key":"46_CR5","doi-asserted-by":"publisher","first-page":"269","DOI":"10.1111\/cts.12294","volume":"8","author":"JB Starren","year":"2015","unstructured":"Starren JB, Winter AQ, Lloyd-Jones DM (2015) Enabling a learning health system through a unified enterprise data warehouse: the experience of the Northwestern University Clinical and Translational Sciences (NUCATS) Institute. Clin Transl Sci 8(4):269\u2013271","journal-title":"Clin Transl Sci"},{"issue":"5","key":"46_CR6","doi-asserted-by":"publisher","first-page":"480","DOI":"10.1097\/01.mlr.0000160417.39497.a9","volume":"43","author":"E Birman-Deych","year":"2005","unstructured":"Birman-Deych E, Waterman AD, Yan Y, Nilasena DS, Radford MJ, Gage BF (2005) Accuracy of ICD-9-CM codes for identifying cardiovascular and stroke risk factors. Med Care 43(5):480\u2013485","journal-title":"Med Care"},{"issue":"6","key":"46_CR7","doi-asserted-by":"publisher","first-page":"952","DOI":"10.1002\/art.20827","volume":"51","author":"JA Singh","year":"2004","unstructured":"Singh JA, Holmgren AR, Noorbaloochi S (2004) Accuracy of Veterans Administration databases for a diagnosis of rheumatoid arthritis. Arthritis Care Res 51(6):952\u2013957","journal-title":"Arthritis Care Res"},{"issue":"5p2","key":"46_CR8","doi-asserted-by":"publisher","first-page":"1620","DOI":"10.1111\/j.1475-6773.2005.00444.x","volume":"40","author":"KJ O'malley","year":"2005","unstructured":"O'malley KJ, Cook KF, Price MD, Wildes KR, Hurdle JF, Ashton CM (2005) Measuring diagnoses: ICD code accuracy. Health Serv Res 40(5p2):1620\u20131639","journal-title":"Health Serv Res"},{"issue":"1","key":"46_CR9","doi-asserted-by":"publisher","first-page":"117","DOI":"10.1136\/amiajnl-2012-001145","volume":"20","author":"G Hripcsak","year":"2012","unstructured":"Hripcsak G, Albers DJ (2012) Next-generation phenotyping of electronic health records. J Am Med Inform Assoc 20(1):117\u2013121","journal-title":"J Am Med Inform Assoc"},{"issue":"7179","key":"46_CR10","doi-asserted-by":"publisher","first-page":"323","DOI":"10.1136\/bmj.318.7179.323","volume":"318","author":"T Greenhalgh","year":"1999","unstructured":"Greenhalgh T (1999) Narrative based medicine: narrative based medicine in an evidence based world. BMJ Br Med J 318(7179):323\u2013325","journal-title":"BMJ Br Med J"},{"issue":"8","key":"46_CR11","doi-asserted-by":"publisher","first-page":"1120","DOI":"10.1002\/acr.20184","volume":"62","author":"KP Liao","year":"2010","unstructured":"Liao KP, Cai T, Gainer V, Goryachev S, Zeng-treitler Q, Raychaudhuri S, Szolovits P, Churchill S, Murphy S, Kohane I, Karlson EW, Plenge RM (2010) Electronic medical records for discovery research in rheumatoid arthritis. Arthritis Care Res 62(8):1120\u20131127","journal-title":"Arthritis Care Res"},{"key":"46_CR12","unstructured":"G. Chao and S. Sun, \"Applying a multitask feature sparsity method for the classification of semantic relations between nominals,\" in Machine Learning and Cybernetics (ICMLC), 2012 International Conference on, 2012, vol. 1, pp. 72\u201376: IEEE"},{"key":"46_CR13","doi-asserted-by":"crossref","unstructured":"Luo Y et al (2017) Natural language processing for EHR-based pharmacovigilance: a structured review. Drug Saf:1\u201315","DOI":"10.1007\/s40264-017-0558-6"},{"key":"46_CR14","unstructured":"Zeng Z, Deng Y, Li X, Naumann T, Luo Y (2018) Natural language processing for EHR-based computational phenotyping. IEEE\/ACM Transactions on Computational Biology and Bioinformatics:1\u20131"},{"key":"46_CR15","doi-asserted-by":"crossref","unstructured":"D. S. Carrell, S. Halgrim, D.T. Tran, D. S. M. Buist, J. Chubak, W. W. Chapman, G. Savova, \"Using natural language processing to improve efficiency of manual chart abstraction in research: the case of breast cancer recurrence,\" American journal of epidemiology, p. kwt441, 2014, 179, 749, 758","DOI":"10.1093\/aje\/kwt441"},{"issue":"2","key":"46_CR16","doi-asserted-by":"publisher","first-page":"349","DOI":"10.1136\/amiajnl-2012-000928","volume":"20","author":"JA Strauss","year":"2013","unstructured":"Strauss JA, Chao CR, Kwan ML, Ahmed SA, Schottinger JE, Quinn VP (2013) Identifying primary and recurrent cancers using a SAS-based natural language processing algorithm. J Am Med Inform Assoc 20(2):349\u2013355","journal-title":"J Am Med Inform Assoc"},{"issue":"11","key":"46_CR17","doi-asserted-by":"publisher","first-page":"2979","DOI":"10.1158\/1055-9965.EPI-09-0607","volume":"18","author":"JL Bosco","year":"2009","unstructured":"Bosco JL et al (2009) Breast cancer recurrence in older women five to ten years after diagnosis. Cancer Epidemiology and Prevention Biomarkers 18(11):2979\u20132983","journal-title":"Cancer Epidemiology and Prevention Biomarkers"},{"issue":"4","key":"46_CR18","doi-asserted-by":"publisher","first-page":"380","DOI":"10.1097\/MLR.0000000000000327","volume":"53","author":"R Haque","year":"2015","unstructured":"Haque R, Shi J, Schottinger JE, Ahmed SA, Chung J, Avila C, Lee VS, Cheetham TC, Habel LA, Fletcher SW, Kwan ML (2015) A hybrid approach to identify subsequent breast cancer using pathology and automated health information data. Med Care 53(4):380\u2013385","journal-title":"Med Care"},{"key":"46_CR19","doi-asserted-by":"publisher","first-page":"164","DOI":"10.1200\/jco.2014.32.30_suppl.164","volume":"32","author":"LP Wallner","year":"2014","unstructured":"Wallner LP, Dibello JR, Li BH, Zheng C, Yu W, Weinmann S, Richert-Boe KE, Ritzwoller DP, VanDenEeden SK, Jacobsen SJ (2014) Development of an algorithm to identify metastatic prostate cancer in electronic medical records using natural language processing. Proc Am Soc Clin Oncol 32:164","journal-title":"Proc Am Soc Clin Oncol"},{"key":"46_CR20","first-page":"137","volume":"ECML-98","author":"T Joachims","year":"1998","unstructured":"Joachims T (1998) Text categorization with support vector machines: learning with many relevant features. Mach Learn ECML-98:137\u2013142","journal-title":"Mach Learn"},{"issue":"5","key":"46_CR21","doi-asserted-by":"publisher","first-page":"869","DOI":"10.1016\/j.jbi.2013.06.014","volume":"46","author":"V Garla","year":"2013","unstructured":"Garla V, Taylor C, Brandt C (2013) Semi-supervised clinical text classification with Laplacian SVMs: an application to cancer case management. J Biomed Inform 46(5):869\u2013875","journal-title":"J Biomed Inform"},{"issue":"5","key":"46_CR22","doi-asserted-by":"publisher","first-page":"817","DOI":"10.1136\/amiajnl-2011-000752","volume":"19","author":"CA Bejan","year":"2012","unstructured":"Bejan CA, Xia F, Vanderwende L, Wurfel MM, Yetisgen-Yildiz M (2012) Pneumonia identification using statistical feature selection. J Am Med Inform Assoc 19(5):817\u2013823","journal-title":"J Am Med Inform Assoc"},{"issue":"6","key":"46_CR23","doi-asserted-by":"publisher","first-page":"736","DOI":"10.1197\/jamia.M2130","volume":"14","author":"IA McCowan","year":"2007","unstructured":"McCowan IA, Moore DC, Nguyen AN, Bowman RV, Clarke BE, Duhig EE, Fry MJ (2007) Collection of cancer stage data by classifying free-text medical reports. J Am Med Inform Assoc 14(6):736\u2013745","journal-title":"J Am Med Inform Assoc"},{"key":"46_CR24","unstructured":"Z. Zeng et al., \"Contralateral breast cancer event detection using Nature Language Processing,\" in AMIA Annual Symposium Proceedings, 2017, vol. 2017, pp. 1885\u20131892: American Medical Informatics Association"},{"key":"46_CR25","unstructured":"R. J. Carroll, A. E. Eyler, and J. C. Denny, \"Na\u00efve electronic health record phenotype identification for rheumatoid arthritis,\" in AMIA annual symposium proceedings, 2011, vol. 2011, p. 189: American Medical Informatics Association"},{"issue":"4","key":"46_CR26","doi-asserted-by":"publisher","first-page":"351","DOI":"10.1197\/jamia.M1176","volume":"10","author":"JC Denny","year":"2003","unstructured":"Denny JC, Smithers JD, Miller RA, Spickard A III (2003) \u201cUnderstanding\u201d medical school curriculum content using KnowledgeMap. J Am Med Inform Assoc 10(4):351\u2013362","journal-title":"J Am Med Inform Assoc"},{"key":"46_CR27","doi-asserted-by":"crossref","unstructured":"Y. Kim, \"Convolutional neural networks for sentence classification,\" arXiv preprint arXiv:1408.5882, 2014","DOI":"10.3115\/v1\/D14-1181"},{"key":"46_CR28","doi-asserted-by":"crossref","unstructured":"N. Kalchbrenner, E. Grefenstette, and P. Blunsom, \"A convolutional neural network for modelling sentences,\" arXiv preprint arXiv:1404.2188, 2014","DOI":"10.3115\/v1\/P14-1062"},{"key":"46_CR29","doi-asserted-by":"crossref","unstructured":"K. S. Tai, R. Socher, and C. D. Manning, \"Improved semantic representations from tree-structured long short-term memory networks,\" arXiv preprint arXiv:1503.00075, 2015","DOI":"10.3115\/v1\/P15-1150"},{"key":"46_CR30","doi-asserted-by":"crossref","unstructured":"Z. Yang, D. Yang, C. Dyer, X. He, A. Smola, and E. Hovy, \"Hierarchical attention networks for document classification,\" in Proceedings of the 2016 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, 2016, pp. 1480\u20131489","DOI":"10.18653\/v1\/N16-1174"},{"key":"46_CR31","unstructured":"S. Gehrmann et al., \"Comparing Rule-Based and Deep Learning Models for Patient Phenotyping,\" arXiv preprint arXiv:1703.08705, 2017"},{"key":"46_CR32","doi-asserted-by":"publisher","first-page":"85","DOI":"10.1016\/j.jbi.2017.07.006","volume":"72","author":"Y Luo","year":"2017","unstructured":"Luo Y (2017) Recurrent neural networks for classifying relations in clinical notes. J Biomed Inform 72:85\u201395","journal-title":"J Biomed Inform"},{"issue":"1","key":"46_CR33","doi-asserted-by":"publisher","first-page":"93","DOI":"10.1093\/jamia\/ocx090","volume":"25","author":"Y Luo","year":"2017","unstructured":"Luo Y, Cheng Y, Uzuner \u00d6, Szolovits P, Starren J (2017) Segment convolutional neural networks (Seg-CNNs) for classifying relations in clinical notes. J Am Med Inform Assoc 25(1):93\u201398","journal-title":"J Am Med Inform Assoc"},{"key":"46_CR34","first-page":"624","volume":"216","author":"Y Wu","year":"2015","unstructured":"Wu Y, Jiang M, Lei J, Xu H (2015) Named entity recognition in Chinese clinical text using deep neural network. Studies in health technology and informatics 216:624","journal-title":"Studies in health technology and informatics"},{"key":"46_CR35","doi-asserted-by":"crossref","unstructured":"A. N. Jagannatha and H. Yu, \"Structured prediction models for RNN based sequence labeling in clinical text,\" in Proceedings of the Conference on Empirical Methods in Natural Language Processing Conference on Empirical Methods in Natural Language Processing, 2016, vol. 2016, p. 856: NIH Public Access","DOI":"10.18653\/v1\/D16-1082"},{"key":"46_CR36","doi-asserted-by":"crossref","unstructured":"A. N. Jagannatha and H. Yu, \"Bidirectional rnn for medical event detection in electronic health records,\" in Proceedings of the conference Association for Computational Linguistics North American Chapter Meeting, 2016, vol. 2016, p. 473: NIH Public Access","DOI":"10.18653\/v1\/N16-1056"},{"issue":"8","key":"46_CR37","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0070944","volume":"8","author":"S DeLisle","year":"2013","unstructured":"DeLisle S, Kim B, Deepak J, Siddiqui T, Gundlapalli A, Samore M, D'Avolio L (2013) Using the electronic medical record to identify community-acquired pneumonia: toward a replicable automated strategy. PLoS One 8(8):e70944","journal-title":"PLoS One"},{"issue":"e1","key":"46_CR38","doi-asserted-by":"publisher","first-page":"e151","DOI":"10.1136\/amiajnl-2014-002642","volume":"22","author":"C Lin","year":"2014","unstructured":"Lin C, Karlson EW, Dligach D, Ramirez MP, Miller TA, Mo H, Braggs NS, Cagan A, Gainer V, Denny JC, Savova GK (2014) Automatic identification of methotrexate-induced liver toxicity in patients with rheumatoid arthritis from the electronic medical record. J Am Med Inform Assoc 22(e1):e151\u2013e161","journal-title":"J Am Med Inform Assoc"},{"key":"46_CR39","doi-asserted-by":"publisher","first-page":"h1885","DOI":"10.1136\/bmj.h1885","volume":"350","author":"KP Liao","year":"2015","unstructured":"Liao KP, Cai T, Savova GK, Murphy SN, Karlson EW, Ananthakrishnan AN, Gainer VS, Shaw SY, Xia Z, Szolovits P, Churchill S, Kohane I (2015) Development of phenotype algorithms using electronic medical records and incorporating natural language processing. bmj 350:h1885","journal-title":"bmj"},{"key":"46_CR40","doi-asserted-by":"crossref","unstructured":"F. Galton, Finger prints. Macmillan and Company, 1892","DOI":"10.2307\/2842054"},{"issue":"2","key":"46_CR41","doi-asserted-by":"publisher","first-page":"452","DOI":"10.1002\/1097-0142(19930115)71:2<452::AID-CNCR2820710228>3.0.CO;2-B","volume":"71","author":"CR Leemans","year":"1993","unstructured":"Leemans CR, Tiwari R, Nauta J, Van der Waal I, Snow GB (1993) Regional lymph node involvement and its significance in the development of distant metastases in head and neck carcinoma. Cancer 71(2):452\u2013456","journal-title":"Cancer"},{"key":"46_CR42","unstructured":"A. R. Aronson, \"Metamap: mapping text to the umls metathesaurus,\" Bethesda, MD: NLM, NIH, DHHS, pp. 1\u201326, 2006"},{"key":"46_CR43","first-page":"677","volume":"192","author":"WW Chapman","year":"2013","unstructured":"Chapman WW et al (2013) Extending the NegEx lexicon for multiple languages. Stud Health Technol Inform 192:677","journal-title":"Stud Health Technol Inform"},{"key":"46_CR44","first-page":"2825","volume":"12","author":"F Pedregosa","year":"2011","unstructured":"Pedregosa F et al (2011) Scikit-learn: machine learning in Python. J Mach Learn Res 12:2825\u20132830","journal-title":"J Mach Learn Res"},{"key":"46_CR45","doi-asserted-by":"crossref","unstructured":"L. De Vine, G. Zuccon, B. Koopman, L. Sitbon, and P. Bruza, \"Medical semantic similarity with a neural language model,\" in Proceedings of the 23rd ACM international conference on conference on information and knowledge management, 2014, pp. 1819\u20131822: ACM","DOI":"10.1145\/2661829.2661974"},{"key":"46_CR46","unstructured":"M. Abadi et al, \"Tensorflow: a system for large-scale machine learning,\" in OSDI, 2016, vol. 16, pp. 265\u2013283"},{"key":"46_CR47","unstructured":"D. Kinga and J. B. Adam, \"A method for stochastic optimization,\" in International Conference on Learning Representations (ICLR), 2015, vol. 5"},{"key":"46_CR48","doi-asserted-by":"crossref","unstructured":"Luo Y, Xin Y, Hochberg E, Joshi R, Uzuner O, Szolovits P (2015) Subgraph augmented non-negative tensor factorization (SANTF) for modeling clinical narrative text. J Am Med Inform Assoc:ocv016","DOI":"10.1093\/jamia\/ocv016"},{"issue":"5","key":"46_CR49","doi-asserted-by":"publisher","first-page":"824","DOI":"10.1136\/amiajnl-2013-002443","volume":"21","author":"Y Luo","year":"2014","unstructured":"Luo Y, Sohani AR, Hochberg EP, Szolovits P (2014) Automatic lymphoma classification with sentence subgraph mining from pathology reports. J Am Med Inform Assoc 21(5):824\u2013832","journal-title":"J Am Med Inform Assoc"},{"key":"46_CR50","doi-asserted-by":"publisher","first-page":"e232","DOI":"10.1136\/amiajnl-2013-001932","volume":"20","author":"MR Boland","year":"2013","unstructured":"Boland MR, Hripcsak G, Shen Y, Chung WK, Weng C (2013) Defining a comprehensive verotype using electronic health records for personalized medicine. J Am Med Inform Assoc 20:e232\u2013e238","journal-title":"J Am Med Inform Assoc"}],"container-title":["Journal of Healthcare Informatics Research"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s41666-019-00046-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s41666-019-00046-3\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s41666-019-00046-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,4,6]],"date-time":"2020-04-06T23:14:06Z","timestamp":1586214846000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s41666-019-00046-3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,4,8]]},"references-count":50,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2019,9]]}},"alternative-id":["46"],"URL":"https:\/\/doi.org\/10.1007\/s41666-019-00046-3","relation":{},"ISSN":["2509-4971","2509-498X"],"issn-type":[{"value":"2509-4971","type":"print"},{"value":"2509-498X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2019,4,8]]},"assertion":[{"value":"12 July 2018","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"30 November 2018","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"7 January 2019","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"8 April 2019","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}