{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,27]],"date-time":"2025-10-27T10:42:11Z","timestamp":1761561731538},"reference-count":59,"publisher":"Oxford University Press (OUP)","issue":"5","content-domain":{"domain":["bmj.com"],"crossmark-restriction":true},"short-container-title":["J Am Med Inform Assoc"],"published-print":{"date-parts":[[2013,9]]},"DOI":"10.1136\/amiajnl-2012-001453","type":"journal-article","created":{"date-parts":[[2013,3,14]],"date-time":"2013-03-14T03:25:40Z","timestamp":1363231540000},"page":"931-939","update-policy":"http:\/\/dx.doi.org\/10.1136\/crossmarkpolicy","source":"Crossref","is-referenced-by-count":28,"title":["Improving performance of natural language processing part-of-speech tagging on clinical narratives through domain adaptation"],"prefix":"10.1093","volume":"20","author":[{"given":"Jeffrey P","family":"Ferraro","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"suffix":"III","given":"Hal","family":"Daum\u00e9","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Scott L","family":"DuVall","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Wendy W","family":"Chapman","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Henk","family":"Harkema","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Peter J","family":"Haug","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"286","published-online":{"date-parts":[[2013,9,1]]},"reference":[{"key":"2015062501525251000_20.5.931.1","unstructured":"Haug PJ Christensen L Gundersen M . A natural language parsing system for encoding admitting diagnoses. Proceedings of AMIA Annual Fall Symposium; 1997:814\u201318."},{"key":"2015062501525251000_20.5.931.2","unstructured":"Haug PJ Koehler SB Christensen LM . Inventors; Probabilistic method for natural language processing and for encoding free-text data into a medical database by utilizing a Bayesian network to perform spell checking of words. US patent 6292771. Alexandria, VA: United States Patent and Trademark Office, 2001 Sept 18."},{"key":"2015062501525251000_20.5.931.3","unstructured":"Jain NL Friedman C . Identification of findings suspicious for breast cancer based on natural language processing of mammogram reports. Proceedings of AMIA Annual Fall Symposium; 1997:829\u201333."},{"key":"2015062501525251000_20.5.931.4","unstructured":"Jain NL Knirsch CA Friedman C . Identification of suspected tuberculosis patients based on natural language processing of chest radiograph reports. Proceedings of AMIA Annual Fall Symposium; 1996:542\u20136."},{"key":"2015062501525251000_20.5.931.5","doi-asserted-by":"crossref","unstructured":"Jones B Ferraro JP Haug P . Performance of a real-time electronic screening tool for pneumonia [abstract]. Am J Respir Crit Care Med 2012;185:A5136.","DOI":"10.1164\/ajrccm-conference.2012.185.1_MeetingAbstracts.A5136"},{"key":"2015062501525251000_20.5.931.6","doi-asserted-by":"publisher","DOI":"10.1111\/j.1553-2712.2012.01445.x"},{"key":"2015062501525251000_20.5.931.7","doi-asserted-by":"crossref","unstructured":"Chang MW Do Q Roth D . Multilingual dependency parsing: a pipeline approach. In: Nicolov N Bontcheva K Angelova G . Recent advances in natural language processing IV. Amsterdam: John Benjamins Publishing Co., 2007:55\u201378.","DOI":"10.1075\/cilt.292.10cha"},{"key":"2015062501525251000_20.5.931.8","doi-asserted-by":"crossref","unstructured":"Finkel JR Manning CD Ng AY . Solving the problem of cascading errors: approximate Bayesian inference for linguistic annotation pipelines. Proceedings of EMNLP; 2006:618\u201326.","DOI":"10.3115\/1610075.1610162"},{"key":"2015062501525251000_20.5.931.9","doi-asserted-by":"publisher","DOI":"10.1136\/amiajnl-2011-000465"},{"key":"2015062501525251000_20.5.931.10","unstructured":"UMLS Reference Manual. Specialist lexicon and lexical tools. Bethesda, MD: National Library of Medicine (US); http:\/\/www.ncbi.nlm.nih.gov\/books\/NBK9680\/ (accessed 7 Jul 2012)."},{"key":"2015062501525251000_20.5.931.11","unstructured":"Campbell DA Johnson SB . A transformational-based learner for dependency grammars in discharge summaries. Proceedings of ACL; 2002;3:37\u201344."},{"key":"2015062501525251000_20.5.931.12","doi-asserted-by":"publisher","DOI":"10.3115\/991250.991346"},{"key":"2015062501525251000_20.5.931.13","doi-asserted-by":"crossref","unstructured":"Florian R Ngai G . Multidimensional transformation-based learning. Proceedings of the 2001 Workshop on Computational Natural Language Learning; 2001;7: 1\u20138.","DOI":"10.3115\/1117822.1117823"},{"key":"2015062501525251000_20.5.931.14","doi-asserted-by":"crossref","unstructured":"Kim J Schwarm SE Ostendorf M . Detecting structural metadata with decision trees and transformation-based learning. Proceedings of HLT\/NAACL; 2004:137\u201344.","DOI":"10.21236\/ADA457891"},{"key":"2015062501525251000_20.5.931.15","doi-asserted-by":"crossref","unstructured":"Jurcicek F Ga\u0161ic M Keizer S . Transformation-based learning for semantic parsing. Proceedings of Interspeech; 2009:2719\u201322.","DOI":"10.21437\/Interspeech.2009-695"},{"key":"2015062501525251000_20.5.931.16","unstructured":"Meystre SM Savova GK Kipper-Schuler KC . Extracting information from textual documents in the electronic health record: a review of recent research. Yearb Med Inform 2008;35:128\u201344."},{"key":"2015062501525251000_20.5.931.17","doi-asserted-by":"publisher","DOI":"10.1016\/S1532-0464(03)00012-1"},{"key":"2015062501525251000_20.5.931.18","doi-asserted-by":"crossref","unstructured":"Friedman C . Semantic text parsing for patient records. In: Chen H Fuller S Friedman C . Medical informatics: knowledge management and data mining in biomedicine. 1st edn. New York: Springer-Verlag, 2005:423\u201348.","DOI":"10.1007\/0-387-25739-X_15"},{"key":"2015062501525251000_20.5.931.19","doi-asserted-by":"crossref","unstructured":"Ceusters W Buekens F De Moor G . The distinction between linguistic and conceptual semantics in medical terminology and its implication for NLP-based knowledge acquisition. Methods Inf Med 1998;37:327\u201333.","DOI":"10.1055\/s-0038-1634568"},{"key":"2015062501525251000_20.5.931.20","unstructured":"Campbell DA Johnson SB . Comparing syntactic complexity in medical and non-medical corpora. Proceedings of AMIA Symposium; 2001:90\u20134."},{"key":"2015062501525251000_20.5.931.21","doi-asserted-by":"publisher","DOI":"10.1016\/j.jbi.2005.02.009"},{"key":"2015062501525251000_20.5.931.22","doi-asserted-by":"crossref","unstructured":"Manning C . Part-of-speech tagging from 97% to 100%: is it time for some linguistics? Proceedings of the 12th International Conference on Intelligent Text Processing and Computational Linguistics; 2011:171\u201389.","DOI":"10.1007\/978-3-642-19400-9_14"},{"key":"2015062501525251000_20.5.931.23","doi-asserted-by":"crossref","unstructured":"Toutanova K Manning CD . Enriching the knowledge sources used in a maximum entropy part-of-speech tagger. Joint Sigdat Conference on EMNLP\/VLC;2000:63\u201370.","DOI":"10.3115\/1117794.1117802"},{"key":"2015062501525251000_20.5.931.24","doi-asserted-by":"crossref","unstructured":"Toutanova K Klein D Manning CD . Feature-rich part-of-speech tagging with a cyclic dependency network. Proceedings of of HLT-NAACL; 2003:252\u20139.","DOI":"10.3115\/1073445.1073478"},{"key":"2015062501525251000_20.5.931.25","unstructured":"Shen L Satta G Joshi A . Guided learning for bidirectional sequence classification. Proceedings of ACL; 2007;45:760\u20137."},{"key":"2015062501525251000_20.5.931.26","unstructured":"S\u00f8gaard A . Simple semi-supervised training of part-of-speech taggers. Proceedings of ACL; 2010:205\u20138."},{"key":"2015062501525251000_20.5.931.27","unstructured":"Wikipedia: POS tagging (state of the art). http:\/\/aclweb.org\/aclwiki\/index.php?title=POS_Tagging_(State_of_the_art) (accessed 2 Apr 2012)."},{"key":"2015062501525251000_20.5.931.28","doi-asserted-by":"crossref","unstructured":"Marcus MP Marcinkiewicz MA Santorini B . Building a large annotated corpus of English: the Penn Treebank. Comput Linguist 1993;19:313\u201330.","DOI":"10.21236\/ADA273556"},{"key":"2015062501525251000_20.5.931.29","unstructured":"Baldridge J Morton T Bierner G . OpenNLP part-of-speech tagger. http:\/\/opennlp.apache.org\/ (accessed 2 Apr 2012)."},{"key":"2015062501525251000_20.5.931.30","unstructured":"Ratnaparkhi A . A maximum entropy model for part-of-speech tagging. Proceedings of EMNLP; 1996;1:133\u201342."},{"key":"2015062501525251000_20.5.931.31","unstructured":"Rizzolo N Roth D . Learning based java for rapid development of nlp systems. Proceedings of LREC; 2010:958\u201364."},{"key":"2015062501525251000_20.5.931.32","unstructured":"Roth D Zelenko D . Part of speech tagging using a network of linear separators. The 17th International Conference on Computational Linguistics; 1998;2:1136\u201342."},{"key":"2015062501525251000_20.5.931.33","doi-asserted-by":"crossref","unstructured":"Littlestone N . Learning quickly when irrelevant attributes abound: a new linear-threshold algorithm. Machine Learning 1988;2:285\u2013318.","DOI":"10.1007\/BF00116827"},{"key":"2015062501525251000_20.5.931.34","unstructured":"Littlestone N . Mistake bounds and logarithmic linear-threshold learning algorithms [PhD thesis]. Santa Cruz: University of California, 1990. Technical Report UCSC-CRL-89-11."},{"key":"2015062501525251000_20.5.931.35","unstructured":"LingPipe 4.1.0. http:\/\/alias-i.com\/lingpipe (accessed 2 Apr 2012)."},{"key":"2015062501525251000_20.5.931.36","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/btg1023"},{"key":"2015062501525251000_20.5.931.37","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/bth227"},{"key":"2015062501525251000_20.5.931.38","doi-asserted-by":"crossref","unstructured":"Daum\u00e9 H III Marcu D . Learning as search optimization: approximate large margin methods for structured prediction. Proceedings of the 22nd international conference on Machine Learning; 2005:169\u201376.","DOI":"10.1145\/1102351.1102373"},{"key":"2015062501525251000_20.5.931.39","unstructured":"Daum\u00e9 H . Frustratingly easy domain adaptation. Proceedings of 45th Ann Meeting of the Assoc Computational Linguistics; 2007;45:256\u201363."},{"key":"2015062501525251000_20.5.931.40","unstructured":"Brill E . Transformation-based error-driven learning and natural language processing: a case study in part-of-speech tagging. Comput Linguist; 1995;21:543\u201365."},{"key":"2015062501525251000_20.5.931.41","doi-asserted-by":"publisher","DOI":"10.1016\/j.ijmedinf.2005.08.006"},{"key":"2015062501525251000_20.5.931.42","doi-asserted-by":"crossref","unstructured":"Brants T . TnT: a statistical part-of-speech tagger. Proceedings of ANLP; 2000:224\u201331.","DOI":"10.3115\/974147.974178"},{"key":"2015062501525251000_20.5.931.43","doi-asserted-by":"publisher","DOI":"10.1136\/jamia.2009.001560"},{"key":"2015062501525251000_20.5.931.44","unstructured":"Fan J Prasad R Yabut RM . Part-of-speech tagging for clinical text: wall or bridge between institutions? AMIA Annual Symposium Proceedings 2011:382\u201391."},{"key":"2015062501525251000_20.5.931.45","doi-asserted-by":"publisher","DOI":"10.1197\/jamia.M2392"},{"key":"2015062501525251000_20.5.931.46","doi-asserted-by":"publisher","DOI":"10.1162\/0891201041850894"},{"key":"2015062501525251000_20.5.931.47","doi-asserted-by":"crossref","unstructured":"Blitzer J McDonald R Pereira F . Domain adaptation with structural correspondence learning. Proceedings of EMNLP; 2006:120\u20138.","DOI":"10.3115\/1610075.1610094"},{"key":"2015062501525251000_20.5.931.48","unstructured":"Santorini B . Part-of-speech tagging guidelines for the Penn Treebank project (3rd revision), Technical Report MS-CIS-90-47. University of Pennsylvania; 1990."},{"key":"2015062501525251000_20.5.931.49","doi-asserted-by":"crossref","unstructured":"Browne AC McCray AT Srinivasan S . The specialist lexicon. Bethesda, MD: Lister Hill National Center for Biomedical Communications, National Library of Medicine; 2000:18\u201321, NLM Technical Report NLM-LHC-93-01.","DOI":"10.1055\/s-0038-1637947"},{"key":"2015062501525251000_20.5.931.50","doi-asserted-by":"publisher","DOI":"10.1037\/h0031619"},{"key":"2015062501525251000_20.5.931.51","unstructured":"Biomedical Language Understanding (BLU) Lab\u2014University of Pittsburgh. Pittsburgh, PA; http:\/\/www.dbmi.pitt.edu\/blulab\/index.html (accessed 7 Jul 2012)."},{"key":"2015062501525251000_20.5.931.52","doi-asserted-by":"publisher","DOI":"10.1016\/0306-4573(91)90091-Y"},{"key":"2015062501525251000_20.5.931.53","unstructured":"Wood JM . Understanding and computing Cohen's kappa: a tutorial. WebPsychEmpiricist http:\/\/wpeinfo\/vault\/wood07\/Wood07pdf (accessed 2 Apr 2012)."},{"key":"2015062501525251000_20.5.931.54","unstructured":"World of computing. Articles on natural language processing: transformation based learning. http:\/\/language.worldofcomputing.net\/pos-tagging\/transformation-based-learning.html# (accessed 7 Jul 2012)."},{"key":"2015062501525251000_20.5.931.55","unstructured":"Brill E . Some advances in transformation-based part of speech tagging. Proceedings of the Twelfth National Conference on Artificial Intelligence (AAAI-94); 1994:722\u20137."},{"key":"2015062501525251000_20.5.931.56","doi-asserted-by":"crossref","unstructured":"Kneser R Ney H . Improved backing-off for m-gram language modeling. IEEE International Conference on Acoustics, Speech, and Signal Processing; 1995;1:181\u20134.","DOI":"10.1109\/ICASSP.1995.479394"},{"key":"2015062501525251000_20.5.931.57","doi-asserted-by":"publisher","DOI":"10.1162\/089120105775299159"},{"key":"2015062501525251000_20.5.931.58","doi-asserted-by":"crossref","unstructured":"Ngai G Florian R . Transformation-based learning in the fast lane. Proceedings of NAACL; 2001:40\u20137.","DOI":"10.3115\/1073336.1073342"},{"key":"2015062501525251000_20.5.931.59","doi-asserted-by":"crossref","unstructured":"Carberry S Vijay-Shanker K Wilson A . Randomized rule selection in transformation-based learning: a comparative study. Nat Lang Eng 2001;7:99\u2013116.","DOI":"10.1017\/S1351324901002662"}],"container-title":["Journal of the American Medical Informatics Association"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/academic.oup.com\/jamia\/article-pdf\/20\/5\/931\/5876681\/20-5-931.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,2,11]],"date-time":"2022-02-11T11:40:31Z","timestamp":1644579631000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/jamia\/article-lookup\/doi\/10.1136\/amiajnl-2012-001453"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2013,9]]},"references-count":59,"journal-issue":{"issue":"5","published-online":{"date-parts":[[2013,9,1]]},"published-print":{"date-parts":[[2013,9]]}},"alternative-id":["10.1136\/amiajnl-2012-001453"],"URL":"https:\/\/doi.org\/10.1136\/amiajnl-2012-001453","relation":{},"ISSN":["1067-5027","1527-974X"],"issn-type":[{"value":"1067-5027","type":"print"},{"value":"1527-974X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2013,9]]}}}