{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,27]],"date-time":"2026-03-27T16:09:03Z","timestamp":1774627743783,"version":"3.50.1"},"reference-count":50,"publisher":"Springer Science and Business Media LLC","issue":"1","funder":[{"DOI":"10.13039\/100005156","name":"Alexander von Humboldt-Stiftung","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100005156","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100004191","name":"Novo Nordisk","doi-asserted-by":"publisher","award":["NNF14CC0001"],"award-info":[{"award-number":["NNF14CC0001"]}],"id":[{"id":"10.13039\/501100004191","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["BMC Bioinformatics"],"published-print":{"date-parts":[[2018,12]]},"DOI":"10.1186\/s12859-018-2021-9","type":"journal-article","created":{"date-parts":[[2018,1,17]],"date-time":"2018-01-17T12:21:51Z","timestamp":1516191711000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":138,"title":["LocText: relation extraction of protein localizations to assist database curation"],"prefix":"10.1186","volume":"19","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-9588-984X","authenticated-orcid":false,"given":"Juan Miguel","family":"Cejuela","sequence":"first","affiliation":[]},{"given":"Shrikant","family":"Vinchurkar","sequence":"additional","affiliation":[]},{"given":"Tatyana","family":"Goldberg","sequence":"additional","affiliation":[]},{"given":"Madhukar Sollepura","family":"Prabhu Shankar","sequence":"additional","affiliation":[]},{"given":"Ashish","family":"Baghudana","sequence":"additional","affiliation":[]},{"given":"Aleksandar","family":"Bojchevski","sequence":"additional","affiliation":[]},{"given":"Carsten","family":"Uhlig","sequence":"additional","affiliation":[]},{"given":"Andr\u00e9","family":"Ofner","sequence":"additional","affiliation":[]},{"given":"Pandu","family":"Raharja-Liu","sequence":"additional","affiliation":[]},{"given":"Lars Juhl","family":"Jensen","sequence":"additional","affiliation":[]},{"given":"Burkhard","family":"Rost","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,1,17]]},"reference":[{"issue":"1","key":"2021_CR1","doi-asserted-by":"publisher","first-page":"25","DOI":"10.1038\/75556","volume":"25","author":"M Ashburner","year":"2000","unstructured":"Ashburner M, Ball CA, Blake JA, Botstein D, Butler H, Cherry JM, Davis AP, Dolinski K, Dwight SS, Eppig JT, Harris MA, Hill DP, Issel-Tarver L, Kasarskis A, Lewis S, Matese JC, Richardson JE, Ringwald M, Rubin GM, Sherlock G. Gene ontology: tool for the unification of biology. the gene ontology consortium. Nat Genet. 2000; 25(1):25\u20139. https:\/\/doi.org\/10.1038\/75556 .","journal-title":"Nat Genet"},{"issue":"6","key":"2021_CR2","doi-asserted-by":"crossref","first-page":"843","DOI":"10.1093\/bioinformatics\/btw723","volume":"33","author":"H Zhou","year":"2017","unstructured":"Zhou H, Yang Y, Shen HB. Hum-mPLoc 3.0: prediction enhancement of human protein subcellular localization through modeling the hidden correlations of gene ontology and functional domain features. Bioinformatics. 2017; 33(6):843\u201353. https:\/\/doi.org\/10.1093\/bioinformatics\/btw723 .","journal-title":"Bioinformatics"},{"issue":"Web Server issu","key":"2021_CR3","doi-asserted-by":"publisher","first-page":"585","DOI":"10.1093\/nar\/gkm259","volume":"35","author":"P Horton","year":"2007","unstructured":"Horton P, Park KJ, Obayashi T, Fujita N, Harada H, Adams-Collier CJ, Nakai K. WoLF PSORT: protein localization predictor. Nucleic Acids Res. 2007; 35(Web Server issue):585\u20137. https:\/\/doi.org\/10.1093\/nar\/gkm259 .","journal-title":"Nucleic Acids Res"},{"issue":"10","key":"2021_CR4","doi-asserted-by":"publisher","first-page":"785","DOI":"10.1038\/nmeth.1701","volume":"8","author":"TN Petersen","year":"2011","unstructured":"Petersen TN, Brunak S, von Heijne G, Nielsen H. SignalP 4.0: discriminating signal peptides from transmembrane regions. Nat Methods. 2011; 8(10):785\u20136. https:\/\/doi.org\/10.1038\/nmeth.1701 .","journal-title":"Nat Methods"},{"issue":"3","key":"2021_CR5","doi-asserted-by":"publisher","first-page":"643","DOI":"10.1002\/prot.21018","volume":"64","author":"CS Yu","year":"2006","unstructured":"Yu CS, Chen YC, Lu CH, Hwang JK. Prediction of protein subcellular localization. Proteins. 2006; 64(3):643\u201351. https:\/\/doi.org\/10.1002\/prot.21018 .","journal-title":"Proteins"},{"issue":"Web Server issu","key":"2021_CR6","doi-asserted-by":"publisher","first-page":"497","DOI":"10.1093\/nar\/gkq477","volume":"38","author":"S Briesemeister","year":"2010","unstructured":"Briesemeister S, Rahnenfuhrer J, Kohlbacher O. YLoc\u2013an interpretable web server for predicting subcellular localization. Nucleic Acids Res. 2010; 38(Web Server issue):497\u2013502. https:\/\/doi.org\/10.1093\/nar\/gkq477 .","journal-title":"Nucleic Acids Res"},{"issue":"13","key":"2021_CR7","doi-asserted-by":"publisher","first-page":"1608","DOI":"10.1093\/bioinformatics\/btq249","volume":"26","author":"NY Yu","year":"2010","unstructured":"Yu NY, Wagner JR, Laird MR, Melli G, Rey S, Lo R, Dao P, Sahinalp SC, Ester M, Foster LJ, Brinkman FS. PSORTb 3.0: improved protein subcellular localization prediction with refined localization subcategories and predictive capabilities for all prokaryotes. Bioinformatics. 2010; 26(13):1608\u201315. https:\/\/doi.org\/10.1093\/bioinformatics\/btq249 .","journal-title":"Bioinformatics"},{"issue":"Web Server issu","key":"2021_CR8","doi-asserted-by":"publisher","first-page":"350","DOI":"10.1093\/nar\/gku396","volume":"42","author":"T Goldberg","year":"2014","unstructured":"Goldberg T, Hecht M, Hamp T, Karl T, Yachdav G, Ahmed N, Altermann U, Angerer P, Ansorge S, Balasz K, Bernhofer M, Betz A, Cizmadija L, Do KT, Gerke J, Greil R, Joerdens V, Hastreiter M, Hembach K, Herzog M, Kalemanov M, Kluge M, Meier A, Nasir H, Neumaier U, Prade V, Reeb J, Sorokoumov A, Troshani I, Vorberg S, Waldraff S, Zierer J, Nielsen H, Rost B. LocTree3 prediction of localization. Nucleic Acids Res. 2014; 42(Web Server issue):350\u20135. https:\/\/doi.org\/10.1093\/nar\/gku396 .","journal-title":"Nucleic Acids Res"},{"key":"2021_CR9","doi-asserted-by":"publisher","first-page":"23","DOI":"10.1007\/978-1-4939-3167-5_2","volume":"1374","author":"E Boutet","year":"2016","unstructured":"Boutet E, Lieberherr D, Tognolli M, Schneider M, Bansal P, Bridge AJ, Poux S, Bougueleret L, Xenarios I. UniProtKB\/Swiss-Prot, the Manually Annotated Section of the UniProt KnowledgeBase: How to Use the Entry View. Methods Mol Biol. 2016; 1374:23\u201354.","journal-title":"Methods Mol Biol"},{"issue":"D1","key":"2021_CR10","doi-asserted-by":"publisher","first-page":"663","DOI":"10.1093\/nar\/gkw1016","volume":"45","author":"LS Gramates","year":"2017","unstructured":"Gramates LS, Marygold SJ, Santos GD, Urbano JM, Antonazzo G, Matthews BB, Rey AJ, Tabone CJ, Crosby MA, Emmert DB, Falls K, Goodman JL, Hu Y, Ponting L, Schroeder AJ, Strelets VB, Thurmond J, Zhou P, the FlyBase Consortium. FlyBase at 25: looking to the future. Nucleic Acids Res. 2017; 45(D1):663\u201371. https:\/\/doi.org\/10.1093\/nar\/gkw1016 .","journal-title":"Nucleic Acids Res"},{"issue":"4","key":"2021_CR11","doi-asserted-by":"publisher","first-page":"547","DOI":"10.1093\/bioinformatics\/btg447","volume":"20","author":"Z Lu","year":"2004","unstructured":"Lu Z, Szafron D, Greiner R, Lu P, Wishart DS, Poulin B, Anvik J, Macdonell C, Eisner R. Predicting subcellular localization of proteins using machine-learned classifiers. Bioinformatics. 2004; 20(4):547\u20136. https:\/\/doi.org\/10.1093\/bioinformatics\/bth026 .","journal-title":"Bioinformatics"},{"issue":"11","key":"2021_CR12","doi-asserted-by":"publisher","first-page":"1410","DOI":"10.1093\/bioinformatics\/btm115","volume":"23","author":"H Shatkay","year":"2007","unstructured":"Shatkay H, Hoglund A, Brady S, Blum T, Donnes P, Kohlbacher O. SherLoc: high-accuracy prediction of protein subcellular localization by integrating text and protein sequence data. Bioinformatics. 2007; 23(11):1410\u20137. https:\/\/doi.org\/10.1093\/bioinformatics\/btm115 .","journal-title":"Bioinformatics"},{"key":"2021_CR13","doi-asserted-by":"publisher","first-page":"78","DOI":"10.1093\/bioinformatics\/18.suppl_1.S78","volume":"18 Suppl 1","author":"R Nair","year":"2002","unstructured":"Nair R, Rost B. Inferring sub-cellular localization through automated lexical analysis. Bioinformatics. 2002; 18 Suppl 1:78\u201386.","journal-title":"Bioinformatics"},{"key":"2021_CR14","doi-asserted-by":"crossref","unstructured":"Mao Y, Van Auken K, Li D, Arighi CN, McQuilton P, Hayman GT, Tweedie S, Schaeffer ML, Laulederkind SJ, Wang SJ, Gobeill J, Ruch P, Luu AT, Kim JJ, Chiang JH, Chen YD, Yang CJ, Liu H, Zhu D, Li Y, Yu H, Emadzadeh E, Gonzalez G, Chen JM, Dai HJ, Lu Z. Overview of the gene ontology task at biocreative iv. Database (Oxford) 2014;2014. https:\/\/doi.org\/10.1093\/database\/bau086 .","DOI":"10.1093\/database\/bau086"},{"issue":"11","key":"2021_CR15","doi-asserted-by":"publisher","first-page":"309","DOI":"10.1371\/journal.pbio.0020309","volume":"2","author":"HM Muller","year":"2004","unstructured":"Muller HM, Kenny EE, Sternberg PW. Textpresso: an ontology-based information retrieval and extraction system for biological literature. PLoS Biol. 2004; 2(11):309. https:\/\/doi.org\/10.1371\/journal.pbio.0020309 .","journal-title":"PLoS Biol"},{"issue":"Database issue","key":"2021_CR16","doi-asserted-by":"publisher","first-page":"789","DOI":"10.1093\/nar\/gkt1063","volume":"42","author":"TW Harris","year":"2014","unstructured":"Harris TW, Baran J, Bieri T, Cabunoc A, Chan J, Chen WJ, Davis P, Done J, Grove C, Howe K, Kishore R, Lee R, Li Y, Muller HM, Nakamura C, Ozersky P, Paulini M, Raciti D, Schindelman G, Tuli MA, Van Auken K, Wang D, Wang X, Williams G, Wong JD, Yook K, Schedl T, Hodgkin J, Berriman M, Kersey P, Spieth J, Stein L, Sternberg PW. WormBase 2014: new views of curated biology. Nucleic Acids Res. 2014; 42(Database issue):789\u201393. https:\/\/doi.org\/10.1093\/nar\/gkt1063 .","journal-title":"Nucleic Acids Res"},{"key":"2021_CR17","doi-asserted-by":"publisher","first-page":"228","DOI":"10.1186\/1471-2105-10-228","volume":"10","author":"K Van Auken","year":"2009","unstructured":"Van Auken K, Jaffery J, Chan J, Muller HM, Sternberg PW. Semi-automated curation of protein subcellular localization: a text mining-based approach to gene ontology (go) cellular component curation. BMC Bioinformatics. 2009; 10:228. https:\/\/doi.org\/10.1186\/1471-2105-10-228 .","journal-title":"BMC Bioinformatics"},{"key":"2021_CR18","doi-asserted-by":"publisher","first-page":"040","DOI":"10.1093\/database\/bas040","volume":"2012","author":"K Van Auken","year":"2012","unstructured":"Van Auken K, Fey P, Berardini TZ, Dodson R, Cooper L, Li D, Chan J, Li Y, Basu S, Muller HM, Chisholm R, Huala E, Sternberg PW, WormBase C. Text mining in the biocuration workflow: applications for literature curation at WormBase, dictyBase and TAIR. Database (Oxford). 2012; 2012:040. https:\/\/doi.org\/10.1093\/database\/bas040 .","journal-title":"Database (Oxford)"},{"key":"2021_CR19","doi-asserted-by":"publisher","first-page":"056","DOI":"10.1093\/database\/bas056","volume":"2013","author":"CN Arighi","year":"2013","unstructured":"Arighi CN, Carterette B, Cohen KB, Krallinger M, Wilbur WJ, Fey P, Dodson R, Cooper L, Van Slyke CE, Dahdul W, Mabee P, Li D, Harris B, Gillespie M, Jimenez S, Roberts P, Matthews L, Becker K, Drabkin H, Bello S, Licata L, Chatr-aryamontri A, Schaeffer ML, Park J, Haendel M, Van Auken K, Li Y, Chan J, Muller HM, Cui H, Balhoff JP, Chi-Yang Wu J, Lu Z, Wei CH, Tudor CO, Raja K, Subramani S, Natarajan J, Cejuela JM, Dubey P, Wu C. An overview of the BioCreative 2012 Workshop Track III: interactive text mining task. Database (Oxford). 2013; 2013:056. https:\/\/doi.org\/10.1093\/database\/bas056 .","journal-title":"Database (Oxford)"},{"key":"2021_CR20","doi-asserted-by":"crossref","unstructured":"Wang Q, S SA, Almeida L, Ananiadou S, Balderas-Martinez YI, Batista-Navarro R, Campos D, Chilton L, Chou HJ, Contreras G, Cooper L, Dai HJ, Ferrell B, Fluck J, Gama-Castro S, George N, Gkoutos G, Irin AK, Jensen LJ, Jimenez S, Jue TR, Keseler I, Madan S, Matos S, McQuilton P, Milacic M, Mort M, Natarajan J, Pafilis E, Pereira E, Rao S, Rinaldi F, Rothfels K, Salgado D, Silva RM, Singh O, Stefancsik R, Su CH, Subramani S, Tadepally HD, Tsaprouni L, Vasilevsky N, Wang X, Chatr-Aryamontri A, Laulederkind SJ, Matis-Mitchell S, McEntyre J, Orchard S, Pundir S, Rodriguez-Esteban R, Van Auken K, Lu Z, Schaeffer M, Wu CH, Hirschman L, Arighi CN. Overview of the interactive task in BioCreative V. Database (Oxford). 2016; 2016. https:\/\/doi.org\/10.1093\/database\/baw119 .","DOI":"10.1093\/database\/baw119"},{"issue":"D1","key":"2021_CR21","doi-asserted-by":"publisher","first-page":"158","DOI":"10.1093\/nar\/gkw1099","volume":"45","author":"The UniProt Consortium","year":"2017","unstructured":"The UniProt Consortium. Uniprot: the universal protein knowledgebase. Nucleic Acids Res. 2017; 45(D1):158\u201369. https:\/\/doi.org\/10.1093\/nar\/gkw1099 .","journal-title":"Nucleic Acids Res"},{"key":"2021_CR22","doi-asserted-by":"publisher","first-page":"51","DOI":"10.1186\/1471-2105-6-51","volume":"6","author":"BT Alako","year":"2005","unstructured":"Alako BT, Veldhoven A, van Baal S, Jelier R, Verhoeven S, Rullmann T, Polman J, Jenster G. CoPub Mapper: mining MEDLINE based on search term co-publication. BMC Bioinformatics. 2005; 6:51. https:\/\/doi.org\/10.1186\/1471-2105-6-51 .","journal-title":"BMC Bioinformatics"},{"issue":"2","key":"2021_CR23","doi-asserted-by":"publisher","first-page":"237","DOI":"10.1093\/bioinformatics\/btl302","volume":"23","author":"D Rebholz-Schuhmann","year":"2007","unstructured":"Rebholz-Schuhmann D, Kirsch H, Arregui M, Gaudan S, Riethoven M, Stoehr P. EBIMed\u2013text crunching to gather facts for proteins from Medline. Bioinformatics. 2007; 23(2):237\u201344. https:\/\/doi.org\/10.1093\/bioinformatics\/btl302 .","journal-title":"Bioinformatics"},{"key":"2021_CR24","doi-asserted-by":"publisher","first-page":"012","DOI":"10.1093\/database\/bau012","volume":"2014","author":"JX Binder","year":"2014","unstructured":"Binder JX, Pletscher-Frankild S, Tsafou K, Stolte C, O\u2019Donoghue SI, Schneider R, Jensen LJ. Compartments: unification and visualization of protein subcellular localization evidence. Database (Oxford). 2014; 2014:012. https:\/\/doi.org\/10.1093\/database\/bau012 .","journal-title":"Database (Oxford)"},{"key":"2021_CR25","doi-asserted-by":"crossref","unstructured":"Stapley BJ, Kelley LA, Sternberg MJ. Predicting the sub-cellular location of proteins from text using support vector machines. Pac Symp Biocomput. 2002::374\u201385. https:\/\/www.ncbi.nlm.nih.gov\/pubmed\/11928491 .","DOI":"10.1142\/9789812799623_0035"},{"issue":"21","key":"2021_CR26","doi-asserted-by":"publisher","first-page":"2512","DOI":"10.1093\/bioinformatics\/btn463","volume":"24","author":"A Fyshe","year":"2008","unstructured":"Fyshe A, Liu Y, Szafron D, Greiner R, Lu P. Improving subcellular localization prediction using text classification and the gene ontology. Bioinformatics. 2008; 24(21):2512\u20137. https:\/\/doi.org\/10.1093\/bioinformatics\/btn463 .","journal-title":"Bioinformatics"},{"key":"2021_CR27","doi-asserted-by":"crossref","unstructured":"Kim MY. Detection of protein subcellular localization based on a full syntactic parser and semantic information. In: 2008 Fifth International Conference on Fuzzy Systems and Knowledge Discovery, vol. 4: 2008. p. 407\u201311. https:\/\/doi.org\/10.1109\/FSKD.2008.529 .","DOI":"10.1109\/FSKD.2008.529"},{"key":"2021_CR28","volume-title":"Proceedings of the Workshop on Current Trends in Biomedical Natural Language Processing: Shared Task","author":"JD Kim","year":"2009","unstructured":"Kim JD, Ohta T, Pyysalo S, Tsujii YKJ. Overview of BioNLP\u201909 shared task on event extraction. In: Proceedings of the Workshop on Current Trends in Biomedical Natural Language Processing: Shared Task. Boulder, Colorado: Association for Computational Linguistics: 2009. p. 1\u20139."},{"key":"2021_CR29","volume-title":"Proceedings of the BioNLP Shared Task 2011 Workshop","author":"JD Kim","year":"2011","unstructured":"Kim JD, Wang Y, Takagi T, Yonezawa A. Overview of Genia event task in BioNLP Shared Task 2011. In: Proceedings of the BioNLP Shared Task 2011 Workshop. Portland, Oregon: Association for Computational Linguistics: 2011. p. 7\u201315."},{"key":"2021_CR30","volume-title":"Human Language Technologies 2007: The Conference of the North American Chapter of the Association for Computational Linguistics; Companion Volume, Short Papers","author":"Y Liu","year":"2007","unstructured":"Liu Y, Shi Z, Sarkar A. Exploiting rich syntactic information for relation extraction from biomedical articles. In: Human Language Technologies 2007: The Conference of the North American Chapter of the Association for Computational Linguistics; Companion Volume, Short Papers. Rochester: Association for Computational Linguistics: 2007. p. 97\u2013100."},{"key":"2021_CR31","doi-asserted-by":"publisher","first-page":"134","DOI":"10.1016\/j.jbi.2015.07.013","volume":"57","author":"W Zheng","year":"2015","unstructured":"Zheng W, Blake C. Using distant supervised learning to identify protein subcellular localizations from full-text scientific articles. J Biomed Inform. 2015; 57:134\u201344. https:\/\/doi.org\/10.1016\/j.jbi.2015.07.013 .","journal-title":"J Biomed Inform"},{"issue":"8","key":"2021_CR32","doi-asserted-by":"publisher","first-page":"124","DOI":"10.1371\/journal.pmed.0020124","volume":"2","author":"JPA Ioannidis","year":"2005","unstructured":"Ioannidis JPA. Why most published research findings are false. PLoS Med. 2005; 2(8):124. https:\/\/doi.org\/10.1371\/journal.pmed.0020124 .","journal-title":"PLoS Med"},{"issue":"9976","key":"2021_CR33","doi-asserted-by":"publisher","first-page":"1380","DOI":"10.1016\/S0140-6736(15)60696-1","volume":"385","author":"R Horton","year":"2015","unstructured":"Horton R. Offline: What is medicine\u2019s 5 sigma?Lancet. 2015; 385(9976):1380. https:\/\/doi.org\/10.1016\/S0140-6736(15)60696-1 .","journal-title":"Lancet"},{"issue":"9","key":"2021_CR34","doi-asserted-by":"publisher","first-page":"643","DOI":"10.1038\/nrd3545","volume":"10","author":"A Mullard","year":"2011","unstructured":"Mullard A. Reliability of \u2019new drug target\u2019 claims called into question. Nat Rev Drug Discov. 2011; 10(9):643\u20134.","journal-title":"Nat Rev Drug Discov"},{"issue":"Suppl 5","key":"2021_CR35","doi-asserted-by":"publisher","first-page":"4","DOI":"10.1186\/1753-6561-9-S5-A4","volume":"9","author":"T Goldberg","year":"2015","unstructured":"Goldberg T, Vinchurkar S, Cejuela JM, Jensen LJ, Rost B. Linked annotations: a middle ground for manual curation of biomedical databases and text corpora. BMC Proc. 2015; 9(Suppl 5):4\u20134. https:\/\/doi.org\/10.1186\/1753-6561-9-S5-A4 .","journal-title":"BMC Proc"},{"key":"2021_CR36","doi-asserted-by":"crossref","unstructured":"Cejuela JM, Bojchevski A, Uhlig C, Bekmukhametov R, Kumar Karn S, Mahmuti S, Baghudana A, Dubey A, Satagopam VP, Rost B. nala: text mining natural language mutation mentions. Bioinformatics. 2017. https:\/\/doi.org\/10.1093\/bioinformatics\/btx083 .","DOI":"10.1093\/bioinformatics\/btx083"},{"issue":"Database issue","key":"2021_CR37","doi-asserted-by":"publisher","first-page":"447","DOI":"10.1093\/nar\/gku1003","volume":"43","author":"D Szklarczyk","year":"2015","unstructured":"Szklarczyk D, Franceschini A, Wyder S, Forslund K, Heller D, Huerta-Cepas J, Simonovic M, Roth A, Santos A, Tsafou KP, Kuhn M, Bork P, Jensen LJ, von Mering C. STRING v10: protein-protein interaction networks, integrated over the tree of life. Nucleic Acids Res. 2015; 43(Database issue):447\u201352. https:\/\/doi.org\/10.1093\/nar\/gku1003 .","journal-title":"Nucleic Acids Res"},{"issue":"3","key":"2021_CR38","first-page":"273","volume":"20","author":"C Cortes","year":"1995","unstructured":"Cortes C, Vapnik V. Support-vector networks. Mach Learn. 1995; 20(3):273\u201397. https:\/\/doi.org\/10.1007\/BF00994018 .","journal-title":"Mach Learn"},{"key":"2021_CR39","first-page":"2825","volume":"12","author":"F Pedregosa","year":"2011","unstructured":"Pedregosa F, Varoquaux G, Gramfort A, Michel V, Thirion B, Grisel O, Blondel M, Prettenhofer P, Weiss R, Dubourg V, Vanderplas J, Passos A, Cournapeau D, Brucher M, Perrot M, Duchesnay \u00c9. Scikit-learn: Machine learning in python. J Mach Learn Res. 2011; 12:2825\u201330.","journal-title":"J Mach Learn Res"},{"issue":"3","key":"2021_CR40","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/1961189.1961199","volume":"2","author":"CC Chang","year":"2011","unstructured":"Chang CC, Lin CJ. LIBSVM: A library for support vector machines. ACM Trans Intell Syst Technol. 2011; 2(3):1\u201327. https:\/\/doi.org\/10.1145\/1961189.1961199 .","journal-title":"ACM Trans Intell Syst Technol"},{"key":"2021_CR41","doi-asserted-by":"crossref","unstructured":"Collins M, Duffy N. Convolution kernels for natural language. In: Proceedings of the 14th Conference on Neural Information Processing Systems. Collins:Duffy:01: 2001. http:\/\/books.nips.cc\/papers\/files\/nips14\/AA58.pdf . Accessed Apr 2017.","DOI":"10.7551\/mitpress\/1120.003.0085"},{"key":"2021_CR42","unstructured":"Joachims T. Transductive inference for text classification using support vector machines. In: Proceedings of the Sixteenth International Conference on Machine Learning. Morgan Kaufmann Publishers Inc.: 1999. p. 200\u20139. 657646."},{"key":"2021_CR43","unstructured":"Moschitti A. Making Tree Kernels Practical for Natural Language Learning. In: 11th Conference of the European Chapter of the Association for Computational Linguistics: 2006. p. 113\u2013120. http:\/\/www.aclweb.org\/anthology\/E06-1015 ."},{"issue":"11","key":"2021_CR44","doi-asserted-by":"publisher","first-page":"1433","DOI":"10.1093\/bioinformatics\/btt156","volume":"29","author":"CH Wei","year":"2013","unstructured":"Wei CH, Harris BR, Kao HY, Lu Z. tmVar: a text mining approach for extracting sequence variants in biomedical literature. Bioinformatics. 2013; 29(11):1433\u20139. https:\/\/doi.org\/10.1093\/bioinformatics\/btt156 .","journal-title":"Bioinformatics"},{"key":"2021_CR45","doi-asserted-by":"crossref","unstructured":"Ng AY. Feature selection, L1 vs. L2 regularization, and rotational invariance. In: Proceedings of the Twenty-first International Conference on Machine Learning. ACM: 2004. p. 78. https:\/\/doi.org\/10.1145\/1015330.1015435 .","DOI":"10.1145\/1015330.1015435"},{"key":"2021_CR46","doi-asserted-by":"crossref","unstructured":"Bj\u00f6rne J, Heimonen J, Ginter F, Airola A, Pahikkala T, Salakoski T. Extracting complex biological events with rich graph-based feature sets. In: Proceedings of the Workshop on Current Trends in Biomedical Natural Language Processing: Shared Task. Association for Computational Linguistics: 2009. p. 10\u201318. 1572343.","DOI":"10.3115\/1572340.1572343"},{"key":"2021_CR47","doi-asserted-by":"crossref","unstructured":"Caporaso JG, Deshpande N, Fink JL, Bourne PE, Cohen KB, Hunter L. Intrinsic evaluation of text mining tools may not predict performance on realistic tasks; 2008. https:\/\/doi.org\/10.1142\/9789812776136_0061 . Accessed Apr 2017.","DOI":"10.1142\/9789812776136_0061"},{"issue":"1","key":"2021_CR48","doi-asserted-by":"publisher","first-page":"49","DOI":"10.1093\/nar\/27.1.49","volume":"27","author":"A Bairoch","year":"1999","unstructured":"Bairoch A, Apweiler R. The SWISS-PROT protein sequence data bank and its supplement TrEMBL in 1999. Nucleic Acids Res. 1999; 27(1):49\u201354.","journal-title":"Nucleic Acids Res"},{"key":"2021_CR49","doi-asserted-by":"crossref","unstructured":"Van Auken K, Schaeffer ML, McQuilton P, Laulederkind SJ, Li D, Wang SJ, Hayman GT, Tweedie S, Arighi CN, Done J, Muller HM, Sternberg PW, Mao Y, Wei CH, Lu Z. BC4GO: a full-text corpus for the BioCreative IV GO task. Database (Oxford). 2014; 2014. https:\/\/doi.org\/10.1093\/database\/bau074 .","DOI":"10.1093\/database\/bau074"},{"issue":"0","key":"2021_CR50","doi-asserted-by":"publisher","first-page":"033","DOI":"10.1093\/database\/bau033","volume":"2014","author":"JM Cejuela","year":"2014","unstructured":"Cejuela JM, McQuilton P, Ponting L, Marygold SJ, Stefancsik R, Millburn GH, Rost B, FlyBase C. tagtog: interactive and text-mining-assisted annotation of gene mentions in PLOS full-text articles. Database (Oxford). 2014; 2014(0):033. https:\/\/doi.org\/10.1093\/database\/bau033 .","journal-title":"Database (Oxford)"}],"container-title":["BMC Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s12859-018-2021-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,29]],"date-time":"2025-06-29T22:05:25Z","timestamp":1751234725000},"score":1,"resource":{"primary":{"URL":"https:\/\/bmcbioinformatics.biomedcentral.com\/articles\/10.1186\/s12859-018-2021-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,1,17]]},"references-count":50,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2018,12]]}},"alternative-id":["2021"],"URL":"https:\/\/doi.org\/10.1186\/s12859-018-2021-9","relation":{},"ISSN":["1471-2105"],"issn-type":[{"value":"1471-2105","type":"electronic"}],"subject":[],"published":{"date-parts":[[2018,1,17]]},"assertion":[{"value":"25 April 2017","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"10 January 2018","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 January 2018","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"Not applicable.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval and consent to participate"}},{"value":"Not applicable.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}},{"value":"The authors declare that they have no competing interests.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}},{"value":"Springer Nature remains neutral with regard to jurisdictional claims in published maps and institutional affiliations.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Publisher\u2019s Note"}}],"article-number":"15"}}