{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,17]],"date-time":"2026-02-17T03:39:16Z","timestamp":1771299556223,"version":"3.50.1"},"reference-count":73,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2012,8,17]],"date-time":"2012-08-17T00:00:00Z","timestamp":1345161600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/2.0"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["BMC Bioinformatics"],"published-print":{"date-parts":[[2012,12]]},"DOI":"10.1186\/1471-2105-13-207","type":"journal-article","created":{"date-parts":[[2012,8,17]],"date-time":"2012-08-17T12:14:47Z","timestamp":1345205687000},"source":"Crossref","is-referenced-by-count":62,"title":["A corpus of full-text journal articles is a robust evaluation tool for revealing differences in performance of biomedical natural language processing tools"],"prefix":"10.1186","volume":"13","author":[{"given":"Karin","family":"Verspoor","sequence":"first","affiliation":[]},{"given":"Kevin Bretonnel","family":"Cohen","sequence":"additional","affiliation":[]},{"given":"Arrick","family":"Lanfranchi","sequence":"additional","affiliation":[]},{"given":"Colin","family":"Warner","sequence":"additional","affiliation":[]},{"given":"Helen L","family":"Johnson","sequence":"additional","affiliation":[]},{"given":"Christophe","family":"Roeder","sequence":"additional","affiliation":[]},{"given":"Jinho D","family":"Choi","sequence":"additional","affiliation":[]},{"given":"Christopher","family":"Funk","sequence":"additional","affiliation":[]},{"given":"Yuriy","family":"Malenkiy","sequence":"additional","affiliation":[]},{"given":"Miriam","family":"Eckert","sequence":"additional","affiliation":[]},{"given":"Nianwen","family":"Xue","sequence":"additional","affiliation":[]},{"suffix":"Jr","given":"William A","family":"Baumgartner","sequence":"additional","affiliation":[]},{"given":"Michael","family":"Bada","sequence":"additional","affiliation":[]},{"given":"Martha","family":"Palmer","sequence":"additional","affiliation":[]},{"given":"Lawrence E","family":"Hunter","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2012,8,17]]},"reference":[{"key":"5412_CR1","first-page":"147","volume-title":"Natural language processing and systems biology","author":"KB Cohen","year":"2004","unstructured":"Cohen KB, Hunter L: Natural language processing and systems biology.. Springer; 2004:147\u2013174 Springer; 2004:147\u2013174"},{"key":"5412_CR2","volume-title":"Proceedings of the Second BioCreative Challenge Evaluation Workshop","author":"M Krallinger","year":"2007","unstructured":"Krallinger M, Leitner F, Valencia A: Assessment of the second BioCreative PPI task: automatic extraction of protein-protein interactions. Proceedings of the Second BioCreative Challenge Evaluation Workshop 2007."},{"issue":"6","key":"5412_CR3","doi-asserted-by":"publisher","first-page":"e1000534","DOI":"10.1371\/journal.pgen.1000534","volume":"5","author":"S Raychaudhuri","year":"2009","unstructured":"Raychaudhuri S, Plenge RM, Rossin EJ, Ng ACY, Purcell SM, Sklar P, Scolnick EM, Xavier RJ, Altshuler D, Daly MJ: Identifying relationships among genomic disease regions: predicting genes at pathogenic SNP associations and rare deletions. PLoS Genet 2009, 5(6):e1000534. 10.1371\/journal.pgen.1000534","journal-title":"PLoS Genet"},{"key":"5412_CR4","doi-asserted-by":"crossref","unstructured":"Cohen KB, Johnson HL, Verspoor K, Roeder C, Hunter L: The structural and content aspects of abstracts versus bodies of full text journal articles are different. BMC Bioinf 2010., 11(492): [doi:10.1186\/1471\u20132105\u201311\u2013492] [doi:10.1186\/1471-2105-11-492]","DOI":"10.1186\/1471-2105-11-492"},{"key":"5412_CR5","doi-asserted-by":"crossref","unstructured":"Clegg A, Shepherd A: Benchmarking natural-language parsers for biological applications using dependency graphs. BMC Bioinf 2007., 8(24): [doi:10.1186\/1471\u20132105\u20138-24] [doi:10.1186\/1471-2105-8-24]","DOI":"10.1186\/1471-2105-8-24"},{"key":"5412_CR6","doi-asserted-by":"publisher","first-page":"183","DOI":"10.1186\/1471-2105-10-183","volume":"10","author":"K Verspoor","year":"2009","unstructured":"Verspoor K, Cohen KB, Hunter L: The textual characteristics of traditional and Open Access scientific journals are similar. BMC Bioinf 2009, 10: 183. [doi:10.1186\/1471\u20132105\u201310\u2013183] [doi:10.1186\/1471-2105-10-183] 10.1186\/1471-2105-10-183","journal-title":"BMC Bioinf"},{"issue":"4","key":"5412_CR7","doi-asserted-by":"publisher","first-page":"196","DOI":"10.1002\/cfg.91","volume":"2","author":"C Blaschke","year":"2001","unstructured":"Blaschke C, Valencia A: Can bibliographic pointers for known biological data be found automatically? Protein interactions as a case study. Comp Funct Genomics 2001, 2(4):196\u2013206. 10.1002\/cfg.91","journal-title":"Comp Funct Genomics"},{"key":"5412_CR8","doi-asserted-by":"publisher","first-page":"20","DOI":"10.1186\/1471-2105-4-20","volume":"4","author":"PK Shah","year":"2003","unstructured":"Shah PK, Perez-Iratxeta C, Bork P, Andrade MA: Information extraction from full text scientific articles: where are the keywords? BMC Bioinf 2003, 4: 20. [doi:10.1186\/1471\u20132105\u20134-20] [doi:10.1186\/1471-2105-4-20] 10.1186\/1471-2105-4-20","journal-title":"BMC Bioinf"},{"issue":"17","key":"5412_CR9","doi-asserted-by":"publisher","first-page":"3206","DOI":"10.1093\/bioinformatics\/bth386","volume":"20","author":"DP Corney","year":"2004","unstructured":"Corney DP, Buxton BF, Langdon WB, Jones DT: BioRAT: extracting biological information from full-length papers. Bioinformatics 2004, 20(17):3206\u20133213. 10.1093\/bioinformatics\/bth386","journal-title":"Bioinformatics"},{"issue":"Suppl 1","key":"5412_CR10","doi-asserted-by":"publisher","first-page":"S74","DOI":"10.1093\/bioinformatics\/17.suppl_1.S74","volume":"17","author":"C Friedman","year":"2001","unstructured":"Friedman C, Kra P, Yu H, Krauthammer M, Rzhetsky A: GENIES: a natural-language processing system for the extraction of molecular pathways from journal articles. Bioinformatics 2001, 17(Suppl 1):S74-S82. 10.1093\/bioinformatics\/17.suppl_1.S74","journal-title":"Bioinformatics"},{"issue":"8","key":"5412_CR11","doi-asserted-by":"publisher","first-page":"1124","DOI":"10.1093\/bioinformatics\/18.8.1124","volume":"18","author":"L Tanabe","year":"2002","unstructured":"Tanabe L, Wilbur WJ: Tagging gene and protein names in biomedical text. Bioinformatics 2002, 18(8):1124\u20131132. 10.1093\/bioinformatics\/18.8.1124","journal-title":"Bioinformatics"},{"key":"5412_CR12","doi-asserted-by":"publisher","first-page":"43","DOI":"10.1016\/j.jbi.2003.10.001","volume":"37","author":"A Rzhetsky","year":"2004","unstructured":"Rzhetsky A, Iossifov I, Koike T, Krauthammer M, Kra P, Morris M, Yu H, Duboue PA, Weng W, Wilbur WJ, Hatzivassiloglou V, Friedman C: GeneWays: a system for extracting, analyzing, visualizing, and integrating molecular pathway data. J Biomed Inf 2004, 37: 43\u201353. 10.1016\/j.jbi.2003.10.001","journal-title":"J Biomed Inf"},{"key":"5412_CR13","volume-title":"Proceedings of BioCreative III","year":"2010","unstructured":"Arighi C, Cohen K, Hirschman L, Krallinger M, Lu Z, Valencia A, Wilbur J, Wu C (Eds): 2010. Proceedings of BioCreative III"},{"key":"5412_CR14","unstructured":"Bada M, Eckert M, Evans D, Garcia K, Shipley K, Sitnikov D, Baumgartner Jr WA, Cohen KB, Verspoor K, Blake JA, Hunter LE: Concept Annotation in the CRAFT Corpus. [\n                    http:\/\/www.biomedcentral.com\/1471\u20132105\/13\/161\n                    \n                  ] []"},{"key":"5412_CR15","doi-asserted-by":"publisher","first-page":"253","DOI":"10.1197\/jamia.M2233","volume":"14","author":"NC Ide","year":"2007","unstructured":"Ide NC, Loane RF, Demner-Fushman D: Essie: A concept-based search engine for structured biomedical text. J Am Med Inf Assoc 2007, 14: 253\u2013263. 10.1197\/jamia.M2233","journal-title":"J Am Med Inf Assoc"},{"issue":"3","key":"5412_CR16","doi-asserted-by":"publisher","first-page":"394","DOI":"10.1093\/bioinformatics\/btn631","volume":"25","author":"Y Miyao","year":"2009","unstructured":"Miyao Y, Sagae K, Saetre R, Matsuzaki T, Tsujii J: Evaluating contributions of natural language parsers to protein-protein interaction extraction. Bioinformatics 2009, 25(3):394\u2013400. 10.1093\/bioinformatics\/btn631","journal-title":"Bioinformatics"},{"key":"5412_CR17","first-page":"1","volume-title":"BioNLP 2009 Companion Volume: Shared Task on Entity Extraction","author":"JD Kim","year":"2009","unstructured":"Kim JD, Ohta T, Pyysalo S, Kano Y, Tsujii J: Overview of BioNLP\u201909 shared task on event extraction. BioNLP 2009 Companion Volume: Shared Task on Entity Extraction 2009, 1\u20139."},{"key":"5412_CR18","first-page":"1","volume":"1","author":"C Grover","year":"2003","unstructured":"Grover C, Lapata M, Lascarides A: A comparison of parsing techniques for the biomedical domain. Nat Language Eng 2003, 1: 1\u201338.","journal-title":"Nat Language Eng"},{"issue":"6","key":"5412_CR19","doi-asserted-by":"publisher","first-page":"430","DOI":"10.1016\/j.ijmedinf.2005.06.009","volume":"75","author":"S Pyysalo","year":"2006","unstructured":"Pyysalo S, Ginter F, Pahikkala T, Boberg J, J\u00e4rvinen J, Salakoski T: Evaluation of two dependency parsers on biomedical corpus targeted at protein-protein interactions. Int J Med Inf 2006, 75(6):430\u2013442. 10.1016\/j.ijmedinf.2005.06.009","journal-title":"Int J Med Inf"},{"key":"5412_CR20","first-page":"137","volume-title":"Third Workshop on Treebanks and Linguistic Theories (TLT) 2004","author":"G Schneider","year":"2004","unstructured":"Schneider G, Rinaldi F, Kaljurand K, Hess M: Steps towards a GENIA dependency treebank. Third Workshop on Treebanks and Linguistic Theories (TLT) 2004 2004, 137\u2013149."},{"key":"5412_CR21","volume-title":"Proceedings of the Human Language Technology conference","author":"T Ohta","year":"2002","unstructured":"Ohta T, Tateisi Y, Kim JD, Mima H, ichi Tsujii J: The GENIA corpus: an annotated corpus in molecular biology. Proceedings of the Human Language Technology conference 2002."},{"issue":"Suppl 1","key":"5412_CR22","doi-asserted-by":"publisher","first-page":"180","DOI":"10.1093\/bioinformatics\/btg1023","volume":"19","author":"JD Kim","year":"2003","unstructured":"Kim JD, Ohta T, Tateisi Y, Tsujii J: GENIA corpus\u2014a semantically annotated corpus for bio-textmining. Bioinformatics 2003, 19(Suppl 1):180\u2013182. 10.1093\/bioinformatics\/btg1023","journal-title":"Bioinformatics"},{"key":"5412_CR23","doi-asserted-by":"publisher","first-page":"38","DOI":"10.3115\/1641484.1641490","volume-title":"Proceedings of the ACL-ISMB workshop on linking biological literature, ontologies and databases","author":"KB Cohen","year":"2005","unstructured":"Cohen KB, Fox L, Ogren PV, Hunter L: Corpus design for biomedical natural language processing. In Proceedings of the ACL-ISMB workshop on linking biological literature, ontologies and databases. Association for Computational Linguistics, Detroit; 2005:38\u201345."},{"key":"5412_CR24","first-page":"156","volume-title":"AMIA 2005 symposium proceedings","author":"KB Cohen","year":"2005","unstructured":"Cohen KB, Fox L, Ogren PV, Hunter L: Empirical data on corpus design and usage in biomedical natural language processing. AMIA 2005 symposium proceedings 2005, 156\u2013160."},{"issue":"Suppl 1","key":"5412_CR25","doi-asserted-by":"publisher","first-page":"S3","DOI":"10.1186\/1471-2105-6-S1-S3","volume":"6","author":"L Tanabe","year":"2005","unstructured":"Tanabe L, Xie N, Thom L, Matten W, Wilbur W: GENETAG: a tagged corpus for gene\/protein named entity recognition. BMC Bioinf 2005, 6(Suppl 1):S3. 10.1186\/1471-2105-6-S1-S3","journal-title":"BMC Bioinf"},{"key":"5412_CR26","doi-asserted-by":"publisher","first-page":"50","DOI":"10.1186\/1471-2105-8-50","volume":"8","author":"S Pyysalo","year":"2007","unstructured":"Pyysalo S, Ginter F, Heimonen J, Bjorne J, Boberg J, Jarvinen J, Salakoski T: BioInfer: a corpus for information extraction in the biomedical domain. BMC Bioinf 2007, 8: 50. 10.1186\/1471-2105-8-50","journal-title":"BMC Bioinf"},{"key":"5412_CR27","doi-asserted-by":"publisher","first-page":"38","DOI":"10.3115\/1572306.1572314","volume-title":"Proceedings of the Workshop on Current Trends in Biomedical Natural Language Processing","author":"G Szarvas","year":"2008","unstructured":"Szarvas G, Vincze V, Farkas R, Csirik J: The BioScope corpus: annotation for negation, uncertainty and their scope in biomedical texts. In Proceedings of the Workshop on Current Trends in Biomedical Natural Language Processing. Association for Computational Linguistics, Columbus, Ohio; 2008:38\u201345. [\n                    http:\/\/www.aclweb.org\/anthology\/W\/W08\/W08\u20130606\n                    \n                  ] []"},{"key":"5412_CR28","first-page":"1","volume-title":"Proceedings of BioNLP Shared Task 2011 Workshop","author":"JD Kim","year":"2011","unstructured":"Kim JD, Pyysalo S, Ohta T, Bossy R, Nguyen N, Tsujii J: Overview of BioNLP Shared Task 2011. In Proceedings of BioNLP Shared Task 2011 Workshop. Association for Computational Linguistics, Portland, Oregon, USA; 2011:1\u20136. [\n                    http:\/\/www.aclweb.org\/anthology\/W11\u20131801\n                    \n                  ] []"},{"key":"5412_CR29","volume-title":"Part-of-Speech Tagging Guidelines for the Penn Treebank Project, 3rd revision","author":"B Santorini","year":"1990","unstructured":"Santorini B: Part-of-Speech Tagging Guidelines for the Penn Treebank Project, 3rd revision. 1990.\n                    http:\/\/repository.upenn.edu\/cis reports\/570\/\n                    \n                   []"},{"key":"5412_CR30","volume-title":"Bracketing Guidelines for Treebank II style","author":"A Bies","year":"1995","unstructured":"Bies A, Ferguson M, Katz K, MacIntyre R: Bracketing Guidelines for Treebank II style. 1995. [\n                    ftp:\/\/ftp.cis.upenn.edu\/pub\/treebank\/doc\/manual\/root.ps.gz\n                    \n                  ] []"},{"key":"5412_CR31","volume-title":"Supplementary Guidelines for English Translation Treebank 2.0","author":"J Mott","year":"2009","unstructured":"Mott J, Warner C, Bies A, Taylor A: Supplementary Guidelines for English Translation Treebank 2.0. 2009.\n                    projects.ldc.upenn.edu\/gale\/task specifications\/ettb guidelines.pdf\n                    \n                   []"},{"key":"5412_CR32","volume-title":"Reconciliation of Differences Between Onto\/WSJ and EXTB","author":"A Taylor","year":"2010","unstructured":"Taylor A: Reconciliation of Differences Between Onto\/WSJ and EXTB. 2010."},{"key":"5412_CR33","volume-title":"Treebank 2a guidelines","author":"A Taylor","year":"2006","unstructured":"Taylor A: Treebank 2a guidelines. 2006.\n                    http:\/\/www-users.york.ac.uk\/lang22\/TB2a Guidelines.htm\n                    \n                   []"},{"key":"5412_CR34","volume-title":"Addendum to the Penn Treebank II Style Bracketing Guidelines: Biomedical Treebank Annotation","author":"C Warner","year":"2004","unstructured":"Warner C, Bies A, Brisson C, Mott J: Addendum to the Penn Treebank II Style Bracketing Guidelines: Biomedical Treebank Annotation. 2004."},{"key":"5412_CR35","doi-asserted-by":"publisher","DOI":"10.7551\/mitpress\/9780262013055.001.0001","volume-title":"The Processes of Life: An Introduction to Molecular Biology","author":"LE Hunter","year":"2009","unstructured":"Hunter LE: The Processes of Life: An Introduction to Molecular Biology. MIT Press, Cambridge, MA; 2009."},{"key":"5412_CR36","first-page":"693","volume-title":"Proceedings of the 49th Annual Meeting of the Association for Computational Linguistics: Human Language Technologies","author":"S Kulick","year":"2011","unstructured":"Kulick S, Bies A, Mott J: Using derivation trees for Treebank error detection. In Proceedings of the 49th Annual Meeting of the Association for Computational Linguistics: Human Language Technologies. Association for Computational Linguistics, Portland, Oregon, USA; 2011:693\u2013698."},{"issue":"5","key":"5412_CR37","doi-asserted-by":"publisher","first-page":"r44","DOI":"10.1186\/gb-2005-6-5-r44","volume":"6","author":"K Eilbeck","year":"2005","unstructured":"Eilbeck K, Lewis SE, Mungall CJ, Yandell M, Stein L, Durbin R, Ashburner M: The Sequence Ontology: a tool for the unification of genome annotations. Genome Biol 2005, 6(5):r44. [doi:10.1186\/gb-2005\u20136-5-r44] [doi:10.1186\/gb-2005-6-5-r44] 10.1186\/gb-2005-6-5-r44","journal-title":"Genome Biol"},{"issue":"Suppl 1","key":"5412_CR38","doi-asserted-by":"publisher","first-page":"D52","DOI":"10.1093\/nar\/gkq1237","volume":"39","author":"D Maglott","year":"2011","unstructured":"Maglott D, Ostell J, Pruitt KD, Tatusova T: Entrez Gene: gene-centered information at NCBI. Nucleic Acids Res 2011, 39(Suppl 1):D52-D57. [\n                    http:\/\/nar.oxfordjournals.org\/content\/39\/suppl1\/D52.abstract\n                    \n                  ] []","journal-title":"Nucleic Acids Res"},{"issue":"Suppl 1","key":"5412_CR39","doi-asserted-by":"publisher","first-page":"D38","DOI":"10.1093\/nar\/gkq1172","volume":"39","author":"EW Sayers","year":"2011","unstructured":"Sayers EW, Barrett T, Benson DA, Bolton E, Bryant SH, Canese K, Chetvernin V, Church DM, DiCuccio M, Federhen S, Feolo M, Fingerman IM, Geer LY, Helmberg W, Kapustin Y, Landsman D, Lipman DJ, Lu Z, Madden TL, Madej T, Maglott DR, Marchler-Bauer A, Miller V, Mizrachi I, Ostell J, Panchenko A, Phan L, Pruitt KD, Schuler GD, Sequeira E, Sherry ST, Shumway M, Sirotkin K, Slotta D, Souvorov A, Starchenko G, Tatusova TA, Wagner L, Wang Y, Wilbur WJ, Yaschenko E, Ye J: Database resources of the National Center for Biotechnology Information. Nucleic Acids Res 2011, 39(Suppl 1):D38-D51. [\n                    http:\/\/nar.oxfordjournals.org\/content\/39\/suppl1\/D38.abstract\n                    \n                  ] []","journal-title":"Nucleic Acids Res"},{"issue":"Suppl 2","key":"5412_CR40","doi-asserted-by":"publisher","first-page":"S2","DOI":"10.1186\/gb-2008-9-s2-s2","volume":"9","author":"L Smith","year":"2008","unstructured":"Smith L, Tanabe L, Johnson nee Ando R, Kuo CJ, Chung IF, Hsu CN, Lin YS, Klinger R, Friedrich C, Ganchev K, Torii M, Liu H, Haddow B, Struble C, Povinelli R, Vlachos A, Baumgartner Jr W, Hunter L, Carpenter B, Tsai RTH, Dai HJ, Liu F, Chen Y, Sun C, Katrenko S, Adriaans P, Blaschke C, Perez RT, Neves M, Nakov P, Divoli A, Mana M, Mata-Vazquez J, Wilber J: Overview of BioCreative II gene mention recognition. Genome Biol 2008, 9(Suppl 2):S2. 10.1186\/gb-2008-9-s2-s2","journal-title":"Genome Biol"},{"issue":"Suppl 2","key":"5412_CR41","doi-asserted-by":"publisher","first-page":"S3","DOI":"10.1186\/gb-2008-9-s2-s3","volume":"9","author":"AA Morgan","year":"2008","unstructured":"Morgan AA, Cohen KB, Hirschman L, et al.: Overview of BioCreative II gene normalization. Genome Biol 2008, 9(Suppl 2):S3. 10.1186\/gb-2008-9-s2-s3","journal-title":"Genome Biol"},{"key":"5412_CR42","doi-asserted-by":"crossref","unstructured":"Yeh A, Morgan A, Colosimo M, Hirschman L: BioCreative task 1A: gene mention finding evaluation. BMC Bioinf 2005., 6(Suppl 1):","DOI":"10.1186\/1471-2105-6-S1-S2"},{"key":"5412_CR43","doi-asserted-by":"publisher","first-page":"70","DOI":"10.3115\/1567594.1567610","volume-title":"Proceedings of the International Joint Workshop on Natural Language Processing in Biomedicine and its Applications (NLPBA)","author":"JD Kim","year":"2004","unstructured":"Kim JD, Ohta T, Tsuruoka Y, Tateisi Y, Collier N: Introduction to the bio-entity recognition task at JNLPBA. Proceedings of the International Joint Workshop on Natural Language Processing in Biomedicine and its Applications (NLPBA) 2004, 70\u201375."},{"issue":"5","key":"5412_CR44","doi-asserted-by":"publisher","first-page":"901","DOI":"10.1142\/S0219720010004999","volume":"8","author":"Y Wang","year":"2010","unstructured":"Wang Y, Kim JD, Saetre R, Pyysalo S, Ohta T, Tsujii J: Improving the inter-corpora compatibility for protein annotations. J Bioinf Comput Biol 2010, 8(5):901\u2013916. 10.1142\/S0219720010004999","journal-title":"J Bioinf Comput Biol"},{"key":"5412_CR45","first-page":"3","volume":"15","author":"D Klein","year":"2003","unstructured":"Klein D, Manning C: Fast exact inference with a factored model for natural language parsing. Adv Neural Inf Process Syst 2003, 15: 3\u201310.","journal-title":"Adv Neural Inf Process Syst"},{"key":"5412_CR46","doi-asserted-by":"publisher","first-page":"152","DOI":"10.3115\/1220835.1220855","volume-title":"Proceedings of Human Language Technology Conference of the North American Chapter of the Association of Computational Linguistics","author":"D McClosky","year":"2006","unstructured":"McClosky D, Charniak E, Johnson M: Effective self-training for parsing. In Proceedings of Human Language Technology Conference of the North American Chapter of the Association of Computational Linguistics. Association for Computational Linguistics, Brooklyn, NY; 2006:152\u2013159."},{"key":"5412_CR47","volume-title":"Proceedings of the 7th International Conference on Language Resources and Evaluation (LREC\u201910)","author":"D Cer","year":"2010","unstructured":"Cer D, de Marneffe MC, Jurafsky D, Manning CD: Parsing to Stanford Dependencies: Trade-offs between speed and accuracy. Proceedings of the 7th International Conference on Language Resources and Evaluation (LREC\u201910) 2010."},{"key":"5412_CR48","volume-title":"Proceedings of the First International Conference on Human Language Technology Research","author":"M Banko","year":"2001","unstructured":"Banko M, Brill E: Mitigating the paucity-of-data problem: exploring the effect of training corpus size on classifier performance for natural language processing. Proceedings of the First International Conference on Human Language Technology Research 2001."},{"key":"5412_CR49","first-page":"37","volume-title":"BioTxtM 2010: 2nd Workshop on Building and Evaluating Resources for Biomedical Text Mining","author":"KB Cohen","year":"2010","unstructured":"Cohen KB, Lanfranchi A, Corvey W, Jr WAB, Roeder C, Ogren PV, Palmer M, Hunter LE: Annotation of all coreference in biomedical text: Guideline selection and adaptation. BioTxtM 2010: 2nd Workshop on Building and Evaluating Resources for Biomedical Text Mining 2010, 37\u201341."},{"key":"5412_CR50","volume-title":"Proceedings of the American Medical Informatics Association Fall Symposium","author":"KB Cohen","year":"2011","unstructured":"Cohen KB, Christiansen T, Hunter LE: Parenthetically speaking: Classifying the contents of parentheses for text mining. Proceedings of the American Medical Informatics Association Fall Symposium 2011."},{"key":"5412_CR51","unstructured":"PubMed Central Open Access Collection [\n                    http:\/\/www.ncbi.nlm.nih.gov\/pmc\/about\/openftlist.html\n                    \n                  ] []"},{"key":"5412_CR52","volume-title":"The Evalb software","author":"S Sekine","year":"1997","unstructured":"Sekine S, Collins MJ: The Evalb software. 1997.\n                    http:\/\/cs.nyu.edu\/cs\/projects\/proteus\/evalb\n                    \n                   []"},{"key":"5412_CR53","first-page":"1","volume-title":"Proceedings of the Workshop on Software Engineering, Testing, and Quality Assurance for Natural Language Processing (SETQA-NLP 2009)","author":"P Ogren","year":"2009","unstructured":"Ogren P, Bethard S: Building Test Suites for UIMA Components. In Proceedings of the Workshop on Software Engineering, Testing, and Quality Assurance for Natural Language Processing (SETQA-NLP 2009). Association for Computational Linguistics, Boulder, Colorado; 2009:1\u20134."},{"key":"5412_CR54","volume-title":"HLT-NAACL 2006 Companion Volume","author":"P Ogren","year":"2006a","unstructured":"Ogren P: Knowtator: a Protege plugin for annotated corpus construction. HLT-NAACL 2006 Companion Volume 2006a."},{"key":"5412_CR55","first-page":"17","volume-title":"The knowledge model of Protege-2000: Combining interoperability and flexibility","author":"N Noy","year":"2000","unstructured":"Noy N, Fridman N, Fergerson Ray W, Musen M, Mark A: The knowledge model of Protege-2000: Combining interoperability and flexibility. Springer-Verlag, London, UK, UK; 2000:17\u201332."},{"issue":"14","key":"5412_CR56","doi-asserted-by":"publisher","first-page":"3191","DOI":"10.1093\/bioinformatics\/bti475","volume":"21","author":"B Settles","year":"2005","unstructured":"Settles B: ABNER: an open source tool for automatically tagging genes, proteins, and other entity names in text. Bioinformatics 2005, 21(14):3191\u20133192. [\n                    http:\/\/dx.doi.org\/doi:10.1093\/bioinformatics\/bti475\n                    \n                  ] [] 10.1093\/bioinformatics\/bti475","journal-title":"Bioinformatics"},{"key":"5412_CR57","volume-title":"Pac Symp Biocomput","author":"R Leaman","year":"2008","unstructured":"Leaman R, Gonzalez G: BANNER: An executable survey of advances in biomedical named entity recognition. Pac Symp Biocomput 2008."},{"key":"5412_CR58","volume-title":"Phrasal Queries with LingPipe and Lucene","author":"B Carpenter","year":"2004","unstructured":"Carpenter B: Phrasal Queries with LingPipe and Lucene. 2004."},{"key":"5412_CR59","first-page":"249","volume-title":"Von der Form aur Bedeutung: Text automatisch verarbeiten \/ From Form to Meaning: Processing Texts Automatically","author":"K Verspoor","year":"2009","unstructured":"Verspoor K, Baumgartner W, Roeder C, Hunter L: Abstracting the Types away from a UIMA Type System. In Von der Form aur Bedeutung: Text automatisch verarbeiten \/From Form to Meaning: Processing Texts Automatically Edited by: Chiarcos C, Eckhart de Castilho R, Stede M. 2009, 249\u2013256."},{"key":"5412_CR60","volume-title":"The opennlp maximum entropy package","author":"J Baldridge","year":"2002","unstructured":"Baldridge J, Morton T, Bierner G: The opennlp maximum entropy package. 2002. Technical report, SourceForge"},{"issue":"3","key":"5412_CR61","doi-asserted-by":"publisher","first-page":"455","DOI":"10.1147\/sj.433.0455","volume":"43","author":"D Ferrucci","year":"2004","unstructured":"Ferrucci D, Lally A: Building an example application with the unstructured information management architecture. IBM Syst J 2004, 43(3):455\u2013475.","journal-title":"IBM Syst J"},{"issue":"2","key":"5412_CR62","first-page":"313","volume":"19","author":"MP Marcus","year":"1993","unstructured":"Marcus MP, Marcinkiewicz MA, Santorini B: Building a large annotated corpus of English: the Penn Treebank. Comput Linguistics 1993, 19(2):313\u2013330.","journal-title":"Comput Linguistics"},{"key":"5412_CR63","unstructured":"Apache UIMA ConceptMapper Annotator Documentation 2009. Tech. rep., The Apache Software Foundation"},{"key":"5412_CR64","first-page":"433","volume-title":"Proceedings of the 21st International Conference on Computational Linguistics and the 44th annual meeting of the Association for Computational Linguistics","author":"S Petrov","year":"2006","unstructured":"Petrov S, Barrett L, Thibaux R, Klein D: Learning accurate, compact, and interpretable tree annotation. In Proceedings of the 21st International Conference on Computational Linguistics and the 44th annual meeting of the Association for Computational Linguistics. Association for Computational Linguistics, Sydney; 2006:433\u2013440."},{"key":"5412_CR65","first-page":"182","volume-title":"Proc. of EMNLP, Volume 4","author":"D Bikel","year":"2004","unstructured":"Bikel D: A distributional analysis of a lexicalized statistical parsing model. Proc. of EMNLP, Volume 4 2004, 182\u2013189."},{"key":"5412_CR66","first-page":"58","volume-title":"Second International Joint Conference on Natural Language Processing","author":"M Lease","year":"2005","unstructured":"Lease M, Charniak E: Parsing biomedical literature. Second International Joint Conference on Natural Language Processing 2005, 58\u201369."},{"key":"5412_CR67","first-page":"155","volume-title":"Proceedings of the 2006 Conference on Empirical Methods in Natural Language Processing","author":"T Ninomiya","year":"2006","unstructured":"Ninomiya T, Matsuzaki T, Tsuruoka Y, Miyao Y, Tsujii J: Extremely lexicalized models for accurate and fast HPSG parsing. In Proceedings of the 2006 Conference on Empirical Methods in Natural Language Processing. Association for Computational Linguistics, Sydney; 2006:155\u2013163."},{"key":"5412_CR68","volume-title":"Any Domain Parsing: Automatic Domain Adaptation for Natural Language Parsing","author":"D McClosky","year":"2009","unstructured":"McClosky D: Any Domain Parsing: Automatic Domain Adaptation for Natural Language Parsing. 2009. PhD thesis. Brown University, Department of Computer Science"},{"key":"5412_CR69","first-page":"351","volume-title":"Proceedings of the Joint Conference of the 47th Annual Meeting of the ACL and the 4th International Joint Conference on Natural Language Processing of the AFNLP (ACL-IJCNLP\u201909)","author":"J Nivre","year":"2009","unstructured":"Nivre J: Non-projective dependency parsing in expected linear time. Proceedings of the Joint Conference of the 47th Annual Meeting of the ACL and the 4th International Joint Conference on Natural Language Processing of the AFNLP (ACL-IJCNLP\u201909) 2009, 351\u2013359."},{"key":"5412_CR70","doi-asserted-by":"publisher","first-page":"523","DOI":"10.3115\/1220575.1220641","volume-title":"Proceedings of the Conference on Human Language Technology and Empirical Methods in Natural Language Processing (HLT-EMNLP\u201905)","author":"R McDonald","year":"2005","unstructured":"McDonald R, Pereira F, Ribarov K, Hajic J: Non-projective dependency parsing using spanning tree algorithms. Proceedings of the Conference on Human Language Technology and Empirical Methods in Natural Language Processing (HLT-EMNLP\u201905) 2005, 523\u2013530."},{"key":"5412_CR71","doi-asserted-by":"publisher","first-page":"205","DOI":"10.1075\/cilt.309.16cho","volume-title":"Collections of Recent Advances in Natural Language Processing V","author":"JD Choi","year":"2009","unstructured":"Choi JD, Nicolov N: K-best, Locally Pruned, Transition-based Dependency Parsing Using Robust Risk Minimization. In Collections of Recent Advances in Natural Language Processing V. John Benjamins; 2009:205\u2013216."},{"key":"5412_CR72","first-page":"55","volume-title":"Proceedings of the 9th International Workshop on Treebanks and Linguistic Theories (TLT\u20199)","author":"JD Choi","year":"2010","unstructured":"Choi JD, Palmer M: Robust Constituent-to-Dependency Conversion for English. Proceedings of the 9th International Workshop on Treebanks and Linguistic Theories (TLT\u20199) 2010, 55\u201366."},{"key":"5412_CR73","volume-title":"Proceedings of the 16th Nordic Conference of Computational Linguistics (NODALIDA\u201907)","author":"R Johansson","year":"2007","unstructured":"Johansson R, Nugues P: Extended constituent-to-dependency conversion for English. In Proceedings of the 16th Nordic Conference of Computational Linguistics (NODALIDA\u201907). Tartu; 2007. [\n                    http:\/\/dspace.utlib.ee\/dspace\/handle\/10062\/2560\n                    \n                  ] []"}],"container-title":["BMC Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/1471-2105-13-207.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/1471-2105-13-207\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/1471-2105-13-207.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,2,17]],"date-time":"2020-02-17T19:14:07Z","timestamp":1581966847000},"score":1,"resource":{"primary":{"URL":"https:\/\/bmcbioinformatics.biomedcentral.com\/articles\/10.1186\/1471-2105-13-207"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012,8,17]]},"references-count":73,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2012,12]]}},"alternative-id":["5412"],"URL":"https:\/\/doi.org\/10.1186\/1471-2105-13-207","relation":{},"ISSN":["1471-2105"],"issn-type":[{"value":"1471-2105","type":"electronic"}],"subject":[],"published":{"date-parts":[[2012,8,17]]},"article-number":"207"}}