{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T18:38:04Z","timestamp":1743100684986,"version":"3.40.3"},"publisher-location":"Cham","reference-count":26,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783031665370"},{"type":"electronic","value":"9783031665387"}],"license":[{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024]]},"DOI":"10.1007\/978-3-031-66538-7_19","type":"book-chapter","created":{"date-parts":[[2024,7,25]],"date-time":"2024-07-25T17:02:07Z","timestamp":1721926927000},"page":"182-191","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Smoking Status Classification: A Comparative Analysis of\u00a0Machine Learning Techniques with\u00a0Clinical Real World Data"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-4674-0146","authenticated-orcid":false,"given":"Amila","family":"Kugic","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4926-9727","authenticated-orcid":false,"given":"Akhila","family":"Abdulnazar","sequence":"additional","affiliation":[]},{"given":"Anto","family":"Knezovic","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7222-3287","authenticated-orcid":false,"given":"Stefan","family":"Schulz","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9824-9004","authenticated-orcid":false,"given":"Markus","family":"Kreuzthaler","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,7,25]]},"reference":[{"key":"19_CR1","doi-asserted-by":"publisher","unstructured":"Bae, Y.S., et al.: Keyword extraction algorithm for classifying smoking status from unstructured bilingual electronic health records based on natural language processing. Appl. Sci. 11(19), 8812 (2021). https:\/\/doi.org\/10.3390\/app11198812, https:\/\/www.mdpi.com\/2076-3417\/11\/19\/8812","DOI":"10.3390\/app11198812"},{"key":"19_CR2","doi-asserted-by":"publisher","unstructured":"Bressem, K.K., et\u00a0al.: medbert.de: a comprehensive German bert model for the medical domain. Expert Syst. Appl. 237, 121598 (2024). https:\/\/doi.org\/10.1016\/j.eswa.2023.121598, https:\/\/www.sciencedirect.com\/science\/article\/pii\/S0957417423021000","DOI":"10.1016\/j.eswa.2023.121598"},{"key":"19_CR3","doi-asserted-by":"crossref","unstructured":"Caccamisi, A., J\u00f8rgensen, L., Dalianis, H., Rosenlund, M.: Natural language processing and machine learning to enable automatic extraction and classification of patients\u2019 smoking status from electronic medical records. Upsala J. Med. Sci. 125(4), 316\u2013324 (2020)","DOI":"10.1080\/03009734.2020.1792010"},{"key":"19_CR4","doi-asserted-by":"publisher","unstructured":"Devlin, J., Chang, M.W., Lee, K., Toutanova, K.: BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding, May 2019. https:\/\/doi.org\/10.48550\/arXiv.1810.04805, http:\/\/arxiv.org\/abs\/1810.04805, arXiv:1810.04805 [cs]","DOI":"10.48550\/arXiv.1810.04805"},{"key":"19_CR5","doi-asserted-by":"publisher","unstructured":"Hacker, K., Houry, D.: Social needs and social determinants: the role of the centers for disease control and prevention and public health. Public Health Rep. 137(6), 1049\u20131052 (2022). https:\/\/doi.org\/10.1177\/00333549221120244, publisher: SAGE Publications Inc","DOI":"10.1177\/00333549221120244"},{"key":"19_CR6","doi-asserted-by":"publisher","unstructured":"Haque, M.A., Gedara, M.L.B., Nickel, N., Turgeon, M., Lix, L.M.: The validity of electronic health data for measuring smoking status: a systematic review and meta-analysis. BMC Med. Inform. Decision Making 24(1), 33 (2024). https:\/\/doi.org\/10.1186\/s12911-024-02416-3. https:\/\/bmcmedinformdecismak.biomedcentral.com\/articles\/10.1186\/s12911-024-02416-3","DOI":"10.1186\/s12911-024-02416-3"},{"key":"19_CR7","doi-asserted-by":"publisher","unstructured":"Howard, J., Ruder, S.: Universal language model fine-tuning for text classification. In: Gurevych, I., Miyao, Y. (eds.) Proceedings of the 56th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 328\u2013339. Melbourne, Australia (2018). https:\/\/doi.org\/10.18653\/v1\/P18-1031, https:\/\/aclanthology.org\/P18-1031","DOI":"10.18653\/v1\/P18-1031"},{"key":"19_CR8","doi-asserted-by":"publisher","unstructured":"Johnson, A.E., et\u00a0al.: MIMIC-III, a freely accessible critical care database. Sci. Data 3(1), 160035 (2016). https:\/\/doi.org\/10.1038\/sdata.2016.35. https:\/\/www.nature.com\/articles\/sdata201635","DOI":"10.1038\/sdata.2016.35"},{"key":"19_CR9","doi-asserted-by":"publisher","unstructured":"Karlsson, A., et\u00a0al.: Impact of deep learning-determined smoking status on mortality of cancer patients: never too late to quit. ESMO Open 6(3), 100175 (2021). https:\/\/doi.org\/10.1016\/j.esmoop.2021.100175. https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S2059702921001356","DOI":"10.1016\/j.esmoop.2021.100175"},{"key":"19_CR10","unstructured":"Knezovic, A.: Extraction and standardization of smoking status from free-text clinical routine documentation using machine learning methods. Master\u2019s thesis, Medical University of Graz (2023)"},{"key":"19_CR11","doi-asserted-by":"publisher","unstructured":"Kukhareva, P.V., et\u00a0al.: Inaccuracies in electronic health records smoking data and a potential approach to address resulting underestimation in determining lung cancer screening eligibility. J. Am. Med. Inform. Assoc. 29(5), 779\u2013788 (2022). https:\/\/doi.org\/10.1093\/jamia\/ocac020, https:\/\/academic.oup.com\/jamia\/article\/29\/5\/779\/6529026","DOI":"10.1093\/jamia\/ocac020"},{"key":"19_CR12","unstructured":"Lu, W., et\u00a0al.: Tobacco and chronic obstructive pulmonary disease (COPD). World Health Organization, November 2023. https:\/\/www.who.int\/publications-detail-redirect\/9789240084452"},{"key":"19_CR13","doi-asserted-by":"crossref","unstructured":"McHugh, M.L.: Interrater reliability: the Kappa statistic. Biochemia medica 22(3), 276\u2013282 (2012)","DOI":"10.11613\/BM.2012.031"},{"key":"19_CR14","doi-asserted-by":"publisher","first-page":"160940691989922","DOI":"10.1177\/1609406919899220","volume":"19","author":"C O\u2019Connor","year":"2020","unstructured":"O\u2019Connor, C., Joffe, H.: Intercoder reliability in qualitative research: debates and practical guidelines. Int J Qual Methods 19, 1609406919899220 (2020)","journal-title":"Int J Qual Methods"},{"key":"19_CR15","first-page":"2825","volume":"12","author":"F Pedregosa","year":"2011","unstructured":"Pedregosa, F., et al.: Scikit-learn: machine learning in Python. J. Mach. Learn. Res. 12, 2825\u20132830 (2011)","journal-title":"J. Mach. Learn. Res."},{"key":"19_CR16","doi-asserted-by":"crossref","unstructured":"Peng, Y., Yan, S., Lu, Z.: Transfer learning in biomedical natural language processing: an evaluation of bert and elmo on ten benchmarking datasets. In: Proceedings of the 2019 Workshop on Biomedical Natural Language Processing (BioNLP 2019), pp. 58\u201365 (2019)","DOI":"10.18653\/v1\/W19-5006"},{"key":"19_CR17","unstructured":"Rajendran, S., Topaloglu, U.: Extracting smoking status from electronic health records using NLP and deep learning. AMIA Summits Transl. Sci. Proc. 2020, 507\u2013516 (2020). https:\/\/www.ncbi.nlm.nih.gov\/pmc\/articles\/PMC7233082\/"},{"key":"19_CR18","doi-asserted-by":"publisher","unstructured":"Ruckdeschel, J.C., Riley, M., Parsatharathy, S., Chamarthi, R., Rajagopal, C., Hsu, H.S., Mangold, D., Driscoll, C.: Unstructured Data Are Superior to Structured Data for Eliciting Quantitative Smoking History From the Electronic Health Record. JCO clinical cancer informatics 7, e2200155 (Feb 2023). https:\/\/doi.org\/10.1200\/CCI.22.00155","DOI":"10.1200\/CCI.22.00155"},{"key":"19_CR19","doi-asserted-by":"publisher","unstructured":"Schwarz, C.M., et al.: Structure, content, unsafe abbreviations, and completeness of discharge summaries: a retrospective analysis in a University Hospital in Austria. J. Eval. Clin. Practice 27(6), 1243\u20131251 (2021). https:\/\/doi.org\/10.1111\/jep.13533, https:\/\/onlinelibrary.wiley.com\/doi\/10.1111\/jep.13533","DOI":"10.1111\/jep.13533"},{"key":"19_CR20","doi-asserted-by":"publisher","unstructured":"Stabellini, N., et al.: Social determinants of health data improve the prediction of cardiac outcomes in females with breast cancer. Cancers 15(18), 4630 (2023). https:\/\/doi.org\/10.3390\/cancers15184630, https:\/\/www.ncbi.nlm.nih.gov\/pmc\/articles\/PMC10526347\/","DOI":"10.3390\/cancers15184630"},{"key":"19_CR21","unstructured":"The Apache Software Foundation: UIMA. Unstructured Information Management Architecture (2010). https:\/\/uima.apache.org\/"},{"key":"19_CR22","unstructured":"WHO: The European Health Report 2021. Taking stock of the health-related Sustainable Development Goals in the COVID-19 era with a focus on leaving no one behind. World Health Organization, March 2022. https:\/\/www.who.int\/europe\/publications\/i\/item\/9789289057547"},{"key":"19_CR23","doi-asserted-by":"publisher","unstructured":"Wilkinson, M.D., et\u00a0al.: The FAIR guiding principles for scientific data management and stewardship. Sci. Data 3(1) (2016). https:\/\/doi.org\/10.1038\/sdata.2016.18, https:\/\/doi.org\/10.1038\/sdata.2016.18","DOI":"10.1038\/sdata.2016.18"},{"key":"19_CR24","unstructured":"World Health Organization (ed.): European health report 2018: more than numbers - evidence for all. Regional Office for Europe, Copenhague (2018). https:\/\/iris.who.int\/handle\/10665\/279904"},{"key":"19_CR25","doi-asserted-by":"publisher","unstructured":"Yang, X., et al.: A natural language processing tool to extract quantitative smoking status from clinical narratives. In: 2020 IEEE International Conference on Healthcare Informatics (ICHI), pp.\u00a01\u20132, November 2020. https:\/\/doi.org\/10.1109\/ICHI48887.2020.9374369. https:\/\/ieeexplore.ieee.org\/document\/9374369, iSSN: 2575-2634","DOI":"10.1109\/ICHI48887.2020.9374369"},{"key":"19_CR26","unstructured":"Yu, Z., et al.: A study of social and behavioral determinants of health in lung cancer patients using transformers-based natural language processing models. In: AMIA Annual Symposium Proceedings 2021, pp. 1225\u20131233, February 2022. https:\/\/www.ncbi.nlm.nih.gov\/pmc\/articles\/PMC8861705\/"}],"container-title":["Lecture Notes in Computer Science","Artificial Intelligence in Medicine"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-66538-7_19","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,7,25]],"date-time":"2024-07-25T17:04:10Z","timestamp":1721927050000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-66538-7_19"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024]]},"ISBN":["9783031665370","9783031665387"],"references-count":26,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-66538-7_19","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2024]]},"assertion":[{"value":"25 July 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"AIME","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Artificial Intelligence in Medicine","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Salt Lake City, UT","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"USA","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"9 July 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"12 July 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"22","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"aime2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/aime24.aimedicine.info\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}