{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,8]],"date-time":"2026-01-08T18:09:57Z","timestamp":1767895797956,"version":"3.49.0"},"reference-count":112,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2018,4,12]],"date-time":"2018-04-12T00:00:00Z","timestamp":1523491200000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"DOI":"10.13039\/501100004963","name":"Seventh Framework Programme","doi-asserted-by":"publisher","award":["FP7\/2007-2013"],"award-info":[{"award-number":["FP7\/2007-2013"]}],"id":[{"id":"10.13039\/501100004963","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Biomed Semant"],"published-print":{"date-parts":[[2018,12]]},"DOI":"10.1186\/s13326-018-0181-1","type":"journal-article","created":{"date-parts":[[2018,4,12]],"date-time":"2018-04-12T06:20:01Z","timestamp":1523514001000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":33,"title":["Deep learning meets ontologies: experiments to anchor the cardiovascular disease ontology in the biomedical literature"],"prefix":"10.1186","volume":"9","author":[{"given":"Mercedes","family":"Arguello Casteleiro","sequence":"first","affiliation":[]},{"given":"George","family":"Demetriou","sequence":"additional","affiliation":[]},{"given":"Warren","family":"Read","sequence":"additional","affiliation":[]},{"given":"Maria Jesus","family":"Fernandez Prieto","sequence":"additional","affiliation":[]},{"given":"Nava","family":"Maroto","sequence":"additional","affiliation":[]},{"given":"Diego","family":"Maseda Fernandez","sequence":"additional","affiliation":[]},{"given":"Goran","family":"Nenadic","sequence":"additional","affiliation":[]},{"given":"Julie","family":"Klein","sequence":"additional","affiliation":[]},{"given":"John","family":"Keane","sequence":"additional","affiliation":[]},{"given":"Robert","family":"Stevens","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,4,12]]},"reference":[{"key":"181_CR1","unstructured":"sysVASC project, http:\/\/cordis.europa.eu\/project\/rcn\/111200_en.html . Accessed 2 Aug 2017."},{"key":"181_CR2","unstructured":"World Health Organization \u2013 Cardiovascular diseases (CVDs). Available at http:\/\/www.who.int\/cardiovascular_diseases\/en\/ . Accessed 2 Aug 2017."},{"issue":"1","key":"181_CR3","doi-asserted-by":"publisher","first-page":"28","DOI":"10.1186\/2041-1480-4-28","volume":"4","author":"D Rebholz-Schuhmann","year":"2013","unstructured":"Rebholz-Schuhmann D, Kafkas S, Kim JH, Li C, Yepes AJ, Hoehndorf R, Backofen R, Lewin I. Evaluating gold standard corpora against gene\/protein tagging solutions and lexical resources. Journal of biomedical semantics. 2013;4(1):28.","journal-title":"Journal of biomedical semantics"},{"issue":"suppl 1","key":"181_CR4","doi-asserted-by":"publisher","first-page":"D115","DOI":"10.1093\/nar\/gkh131","volume":"32","author":"R Apweiler","year":"2004","unstructured":"Apweiler R, Bairoch A, Wu CH, Barker WC, Boeck-mann B, Ferro S, Gasteiger E, Huang H, Lopez R, Ma-grane M, Martin MJ. UniProt: the universal protein knowledgebase. Nucleic Acids Res. 2004;32(suppl 1):D115\u20139.","journal-title":"Nucleic Acids Res"},{"key":"181_CR5","volume-title":"Conditional random fields: probabilistic models for segmenting and labeling sequence data","author":"J Lafferty","year":"2001","unstructured":"Lafferty, J., McCallum, A. and Pereira, F., . Conditional random fields: probabilistic models for segmenting and labeling sequence data. 2001."},{"issue":"14","key":"181_CR6","doi-asserted-by":"publisher","first-page":"3191","DOI":"10.1093\/bioinformatics\/bti475","volume":"21","author":"B Settles","year":"2005","unstructured":"Settles B. ABNER: an open source tool for automatically tagging genes, proteins and other entity names in text. Bioinformatics. 2005;21(14):3191\u20132.","journal-title":"Bioinformatics"},{"key":"181_CR7","first-page":"652","volume-title":"Pacific symposium on biocomputing","author":"R Leaman","year":"2008","unstructured":"Leaman R, Gonzalez G. BANNER: an executable survey of advances in biomedical named entity recognition. In: Pacific symposium on biocomputing, vol. 13; 2008. p. 652\u201363."},{"key":"181_CR8","doi-asserted-by":"publisher","unstructured":"Hirschman L, Burns GAC, Krallinger M, Arighi C, Cohen KB, Valencia A, Wu CH, Chatr-Aryamontri A, Dowell KG, Huala E, Louren\u00e7o A. Text mining for the biocuration workflow. Database (Oxford). 2012;2012:bas020. https:\/\/doi.org\/10.1093\/database\/bas020 . Print 2012.","DOI":"10.1093\/database\/bas020"},{"issue":"12","key":"181_CR9","doi-asserted-by":"publisher","first-page":"829","DOI":"10.1038\/nrg3337","volume":"13","author":"D Rebholz-Schuhmann","year":"2012","unstructured":"Rebholz-Schuhmann D, Oellrich A, Hoehndorf R. Text-mining solutions for biomedical research: enabling integrative biology. Nat Rev Genet. 2012;13(12):829.","journal-title":"Nat Rev Genet"},{"issue":"1","key":"181_CR10","doi-asserted-by":"publisher","first-page":"372","DOI":"10.1186\/1471-2105-7-372","volume":"7","author":"K Fundel","year":"2006","unstructured":"Fundel K, Zimmer R. Gene and protein nomenclature in public databases. Bmc Bioinformatics. 2006;7(1):372.","journal-title":"Bmc Bioinformatics"},{"issue":"1\u20132","key":"181_CR11","doi-asserted-by":"publisher","first-page":"72","DOI":"10.1002\/cfg.452","volume":"6","author":"I Mani","year":"2005","unstructured":"Mani I, Hu Z, Jang SB, Samuel K, Krause M, Phillips J, Wu CH. Protein name tagging guidelines: lessons learned. Comparative and Functional Genomics. 2005;6(1\u20132):72\u20136.","journal-title":"Comparative and Functional Genomics"},{"issue":"suppl_1","key":"181_CR12","first-page":"D52","volume":"39","author":"D Maglott","year":"2010","unstructured":"Maglott D, Ostell J, Pruitt KD, Tatusova T. Entrez gene: gene-centered information at NCBI. Nucleic Acids Res. 2010;39(suppl_1):D52\u20137.","journal-title":"Nucleic Acids Res"},{"issue":"7553","key":"181_CR13","doi-asserted-by":"publisher","first-page":"436","DOI":"10.1038\/nature14539","volume":"521","author":"Y LeCun","year":"2015","unstructured":"LeCun Y, Bengio Y, Hinton G. Deep learning. Nature. 2015;521(7553):436\u201344.","journal-title":"Nature"},{"issue":"1","key":"181_CR14","doi-asserted-by":"publisher","first-page":"245","DOI":"10.1016\/S0004-3702(97)00063-5","volume":"97","author":"AL Blum","year":"1997","unstructured":"Blum AL, Langley P. Selection of relevant features and examples in machine learning. Artif Intell. 1997;97(1):245\u201371.","journal-title":"Artif Intell"},{"issue":"1","key":"181_CR15","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/505282.505283","volume":"34","author":"F Sebastiani","year":"2002","unstructured":"Sebastiani F. Machine learning in automated text categorization. ACM computing surveys (CSUR). 2002;34(1):1\u201347.","journal-title":"ACM computing surveys (CSUR)"},{"key":"181_CR16","volume-title":"Advances in neural information processing systems, pp. 3111\u20133119","author":"T Mikolov","year":"2013","unstructured":"Mikolov T, Sutskever I, Chen K, Corrado GS, Dean J. Distributed representations of words and phrases and their compositionality. In: Advances in neural information processing systems, pp. 3111\u20133119; 2013."},{"key":"181_CR17","volume-title":"Proceedings of the international conference on learning representations (ICLR)","author":"T Mikolov","year":"2013","unstructured":"Mikolov T, Chen K, Corrado G, Dean J. Efficient estimation of word representations in vector space. In: Proceedings of the international conference on learning representations (ICLR); 2013."},{"key":"181_CR18","first-page":"12","volume":"2016","author":"MT Pilehvar","year":"2016","unstructured":"Pilehvar MT, Collier N. Improved semantic representation for domain-specific entities. ACL. 2016;2016:12.","journal-title":"ACL"},{"key":"181_CR19","unstructured":"Minarro-Gim\u00e9nez JA, Mar\u00edn-Alonso O, Samwald M. Exploring the application of deep learning techniques on medical text corpora. In: E-health \u2013 for continuity of care: IOS Press. Stud Health Technol Inform. 2014;205:584\u20138. (PMID:25160253)."},{"key":"181_CR20","doi-asserted-by":"publisher","unstructured":"Bengio Y, Lee H. Editorial introduction to the neural networks special issue on deep learning of representations. Neural Netw. 2015;64:1-3. https:\/\/doi.org\/10.1016\/j.neunet.2014.12.006 . Epub 2014 Dec 15. (PMID:25595998)","DOI":"10.1016\/j.neunet.2014.12.006"},{"issue":"2","key":"181_CR21","doi-asserted-by":"publisher","first-page":"211","DOI":"10.1037\/0033-295X.104.2.211","volume":"104","author":"TK Landauer","year":"1997","unstructured":"Landauer TK, Dumais ST. A solution to Plato's problem: the latent semantic analysis theory of acquisition, induction, and representation of knowledge. Psychol Rev. 1997;104(2):211.","journal-title":"Psychol Rev"},{"issue":"2","key":"181_CR22","doi-asserted-by":"publisher","first-page":"203","DOI":"10.3758\/BF03204766","volume":"28","author":"K Lund","year":"1996","unstructured":"Lund K, Burgess C. Producing high-dimensional seman-tic spaces from lexical co-occurrence. Behav Res Methods Instrum Comput. 1996;28(2):203\u20138.","journal-title":"Behav Res Methods Instrum Comput"},{"key":"181_CR23","volume-title":"Random indexing of text samples for latent semantic analysis. In proc. of the cog-nitive science society (Vol. 1036)","author":"P Kanerva","year":"2000","unstructured":"Kanerva P, Kristofersson J, Holst A. Random indexing of text samples for latent semantic analysis. In proc. of the cog-nitive science society (Vol. 1036). Erlbaum: Mahwah, NJ; 2000."},{"key":"181_CR24","volume-title":"Proc. of ACM SIGIR conference on research and development in in-formation retrieval. ACM. Pp. 50\u201357","author":"T Hofmann","year":"1999","unstructured":"Hofmann T. Probabilistic latent semantic indexing. In: Proc. of ACM SIGIR conference on research and development in in-formation retrieval. ACM. Pp. 50\u201357; 1999."},{"key":"181_CR25","first-page":"993","volume":"3","author":"DM Blei","year":"2003","unstructured":"Blei DM, Ng AY, Jordan MI. Latent dirichlet allocation. J Mach Learn Res. 2003;3:993\u20131022.","journal-title":"J Mach Learn Res"},{"issue":"2","key":"181_CR26","doi-asserted-by":"publisher","first-page":"390","DOI":"10.1016\/j.jbi.2009.02.002","volume":"42","author":"T Cohen","year":"2009","unstructured":"Cohen T, Widdows D. Empirical distributional semantics: methods and biomedical applications. J Biomed Inform. 2009;42(2):390\u2013405.","journal-title":"J Biomed Inform"},{"key":"181_CR27","first-page":"1059","volume":"2014","author":"A Neelakantan","year":"2014","unstructured":"Neelakantan A, Shankar J, Passos A, McCallum A. Efficient non-parametric estimation of multiple embeddings per word in vector space. EMNLP. 2014;2014:1059\u201369.","journal-title":"EMNLP"},{"key":"181_CR28","doi-asserted-by":"publisher","first-page":"1108","DOI":"10.1016\/j.neucom.2015.07.046","volume":"171","author":"B Hu","year":"2016","unstructured":"Hu B, Tang B, Chen Q, Kang L. A novel word em-bedding learning model using the dissociation between nouns and verbs. Neurocomputing. 2016;171:1108\u201317.","journal-title":"Neurocomputing"},{"key":"181_CR29","doi-asserted-by":"crossref","first-page":"211","DOI":"10.1162\/tacl_a_00134","volume":"3","author":"O Levy","year":"2015","unstructured":"Levy O, Goldberg Y, Dagan I. Improving distributional similarity with lessons learned from word embeddings. Transactions of the Association for Computational Linguistics. 2015;3:211\u201325.","journal-title":"Transactions of the Association for Computational Linguistics"},{"key":"181_CR30","volume-title":"Proc. of languages in biology and medicine","author":"S Pyysalo","year":"2013","unstructured":"Pyysalo S, Ginter F, Moen H, Salakoski T, Ananiadou S. Distributional semantics resources for biomedical text pro-cessing. In: Proc. of languages in biology and medicine; 2013."},{"key":"181_CR31","unstructured":"Merck Manuals, https:\/\/www.msdmanuals.com\/en-gb \/. Accessed 2 Aug 2017."},{"key":"181_CR32","unstructured":"Medscape, http:\/\/www.medscape.com \/. Accessed 2 Aug 2017."},{"key":"181_CR33","unstructured":"Wikipedia, http:\/\/www.wikipedia.org \/. Accessed 2 Aug 2017."},{"issue":"3","key":"181_CR34","doi-asserted-by":"publisher","first-page":"288","DOI":"10.1016\/j.jbi.2006.06.004","volume":"40","author":"T Pedersen","year":"2007","unstructured":"Pedersen T, Pakhomov SV, Patwardhan S, Chute CG. Measures of semantic similarity and relatedness in the biomedical domain. J Biomed Inform. 2007;40(3):288\u201399.","journal-title":"J Biomed Inform"},{"key":"181_CR35","volume-title":"Simlex-999: evaluating semantic models with (genuine) similarity estimation","author":"F Hill","year":"2016","unstructured":"Hill, F., Reichart, R. and Korhonen, A., . Simlex-999: evaluating semantic models with (genuine) similarity estimation. Computational Linguistics 2016."},{"key":"181_CR36","unstructured":"Pakhomov S, McInnes B, Adam T, Liu Y, Pedersen T, Melton GB. Semantic similarity and relatedness between clinical terms: an experimental study. In: AMIA annual symposium proceedings (Vol. 2010, p. 572): American Medical Informatics Association; 2010."},{"key":"181_CR37","first-page":"448","volume-title":"Proceedings of the 14th international joint conference on artificial intelligence","author":"P Resnik","year":"1995","unstructured":"Resnik P. Using information content to evaluate semantic similarity in a taxonomy. In: Proceedings of the 14th international joint conference on artificial intelligence; 1995. p. 448\u201353."},{"issue":"2","key":"181_CR38","doi-asserted-by":"publisher","first-page":"77","DOI":"10.1016\/j.jbi.2004.02.001","volume":"37","author":"JE Caviedes","year":"2004","unstructured":"Caviedes JE, Cimino JJ. Towards the development of a conceptual distance metric for the UMLS. J Biomed Inform. 2004;37(2):77\u201385.","journal-title":"J Biomed Inform"},{"issue":"1","key":"181_CR39","doi-asserted-by":"publisher","first-page":"116","DOI":"10.1145\/503104.503110","volume":"20","author":"L Finkelstein","year":"2002","unstructured":"Finkelstein L, Gabrilovich E, Matias Y, Rivlin E, Solan Z, Wolfman G, Ruppin E. Placing search in context: the concept revisited. ACM Trans Inf Syst. 2002;20(1):116\u201331.","journal-title":"ACM Trans Inf Syst"},{"issue":"2014","key":"181_CR40","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1613\/jair.4135","volume":"49","author":"E Bruni","year":"2014","unstructured":"Bruni E, Tran NK, Baroni M. Multimodal Distributional Semantics. J Artif Intell Res. 2014;49(2014):1\u201347.","journal-title":"J Artif Intell Res"},{"key":"181_CR41","doi-asserted-by":"crossref","unstructured":"Muneeb TH, Sahu SK, Anand A. Evaluating distributed word representations for capturing semantics of biomedical concepts: Proceedings of ACL-IJCNLP; 2015. p. 158.","DOI":"10.18653\/v1\/W15-3820"},{"key":"181_CR42","first-page":"166","volume":"2016","author":"B Chiu","year":"2016","unstructured":"Chiu B, Crichton G, Korhonen A, Pyysalo S. How to train good word embeddings for biomedical NLP. ACL. 2016;2016:166.","journal-title":"ACL"},{"key":"181_CR43","unstructured":"BioASQ challenge, http:\/\/bioasq.org \/. Accessed 2 August 2017."},{"key":"181_CR44","first-page":"491","volume-title":"Mining the web for synonyms: PMI-IR versus LSA on TOEFL","author":"PD Turney","year":"2001","unstructured":"Turney PD. Mining the web for synonyms: PMI-IR versus LSA on TOEFL. Freiburg, Germany: Proceedings of the Twelfth European Conference on Machine Learning (ECML-2001); 2001. p. 491\u2013502."},{"key":"181_CR45","unstructured":"BioCreative challenge, http:\/\/www.biocreative.org\/about\/background\/description\/ . Accessed 2 August 2017."},{"issue":"2","key":"181_CR46","doi-asserted-by":"publisher","first-page":"S2","DOI":"10.1186\/gb-2008-9-s2-s2","volume":"9","author":"L Smith","year":"2008","unstructured":"Smith L, Tanabe LK, nee Ando RJ, Kuo CJ, Chung IF, Hsu CN, Lin YS, Klinger R, Friedrich CM, Ganchev K, Torii M. Overview of BioCreative II gene mention recognition. Genome Biol. 2008;9(2):S2.","journal-title":"Genome Biol"},{"issue":"2","key":"181_CR47","doi-asserted-by":"publisher","first-page":"155","DOI":"10.1093\/bioinformatics\/17.2.155","volume":"17","author":"T Ono","year":"2001","unstructured":"Ono T, Hishigaki H, Tanigami A, Takagi T. Automated extraction of information on protein\u2013protein interactions from the biological literature. Bioinformatics. 2001;17(2):155\u201361.","journal-title":"Bioinformatics"},{"issue":"1","key":"181_CR48","first-page":"100","volume":"28","author":"JA Hartigan","year":"1979","unstructured":"Hartigan JA, Wong MA. Algorithm AS 136: a k-means clustering algorithm. Journal of the Royal Statistical Society. Series C (Applied Statistics). 1979;28(1):100\u20138.","journal-title":"Series C (Applied Statistics)"},{"key":"181_CR49","unstructured":"Ohta T, Pyysalo S, Tsujii JI, Ananiadou S. Open-domain anatomical entity mention detection. In: Proceedings of the workshop on detecting structure in scholarly discourse (pp. 27\u201336): Association for Computational Linguistics; 2012."},{"key":"181_CR50","unstructured":"Do\u011fan RI, Lu Z. An improved corpus of disease mentions in PubMed citations. In: Proceedings of the 2012 workshop on biomedical natural language processing (pp. 91\u201399): Association for Computational Linguistics; 2012."},{"key":"181_CR51","doi-asserted-by":"crossref","unstructured":"Kim JD, Ohta T, Tsuruoka Y, Tateisi Y, Collier N. Introduction to the bio-entity recognition task at JNLPBA. In: Proceedings of the international joint workshop on natural language processing in biomedicine and its applications (pp. 70\u201375): Association for Computational Linguistics; 2004.","DOI":"10.3115\/1567594.1567610"},{"issue":"suppl 1","key":"181_CR52","doi-asserted-by":"publisher","first-page":"i180","DOI":"10.1093\/bioinformatics\/btg1023","volume":"19","author":"JD Kim","year":"2003","unstructured":"Kim JD, Ohta T, Tateisi Y, Tsujii JI. GENIA corpus\u2014a semantically annotated corpus for bio-textmining. Bioinformatics. 2003;19(suppl 1):i180\u20132.","journal-title":"Bioinformatics"},{"key":"181_CR53","volume-title":"Medical subject headings: main headings, subheadings, and cross references used in the index Medicus and the National Library of medicine catalog","author":"National Library of Medicine","year":"1960","unstructured":"National Library of Medicine. Medical subject headings: main headings, subheadings, and cross references used in the index Medicus and the National Library of medicine catalog. 1st ed. Washington: U.S. Department of Health, Education, and Welfare; 1960.","edition":"1"},{"key":"181_CR54","doi-asserted-by":"publisher","first-page":"44","DOI":"10.1016\/j.ymeth.2015.03.026","volume":"83","author":"L Li","year":"2015","unstructured":"Li L, Guo R, Jiang Z, Huang D. An approach to improve kernel-based protein\u2013protein interaction extraction by learning from large-scale network data. Methods. 2015;83:44\u201350.","journal-title":"Methods"},{"issue":"4","key":"181_CR55","first-page":"467","volume":"18","author":"PF Brown","year":"1992","unstructured":"Brown PF, Desouza PV, Mercer RL, Pietra VJD, Lai JC. Class-based n-gram models of natural language. Computational linguistics. 1992;18(4):467\u201379.","journal-title":"Computational linguistics"},{"issue":"3","key":"181_CR56","doi-asserted-by":"publisher","first-page":"S6","DOI":"10.1186\/1471-2105-9-S3-S6","volume":"9","author":"S Pyysalo","year":"2008","unstructured":"Pyysalo S, Airola A, Heimonen J, Bj\u00f6rne J, Ginter F, Salakoski T. Comparative analysis of five protein-protein interaction corpora. BMC bioinformatics. 2008;9(3):S6.","journal-title":"BMC bioinformatics"},{"issue":"Pt 1","key":"181_CR57","first-page":"268","volume":"11","author":"AR Aronson","year":"2004","unstructured":"Aronson AR, Mork JG, Gay CW, Humphrey SM, Rogers WJ. The NLM indexing initiative's medical text indexer. Medinfo. 2004;11(Pt 1):268\u201372.","journal-title":"Medinfo"},{"issue":"12","key":"181_CR58","doi-asserted-by":"publisher","first-page":"i339","DOI":"10.1093\/bioinformatics\/btv237","volume":"31","author":"K Liu","year":"2015","unstructured":"Liu K, Peng S, Wu J, Zhai C, Mamitsuka H, Zhu S. MeSHLabeler: improving the accuracy of large-scale MeSH indexing by integrating diverse evidence. Bioinformatics. 2015;31(12):i339\u201347.","journal-title":"Bioinformatics"},{"issue":"12","key":"181_CR59","doi-asserted-by":"publisher","first-page":"i70","DOI":"10.1093\/bioinformatics\/btw294","volume":"32","author":"S Peng","year":"2016","unstructured":"Peng S, You R, Wang H, Zhai C, Mamitsuka H, Zhu S. DeepMeSH: deep semantic representation for improving large-scale MeSH indexing. Bioinformatics. 2016;32(12):i70\u20139.","journal-title":"Bioinformatics"},{"key":"181_CR60","unstructured":"NDF-RT ontology, https:\/\/bioportal.bioontology.org\/ontologies\/NDFRT . Accessed 2 Aug 2017."},{"key":"181_CR61","doi-asserted-by":"publisher","unstructured":"K\u00f6hler S, Doelken SC, Mungall CJ, Bauer S, Firth HV, Bailleul-Forestier I, Black GC, Brown DL, Brudno M, Campbell J, FitzPatrick DR. The human phenotype ontology project: linking molecular biology and disease through phenotype data. Nucleic Acids Res. 2014;42(Database issue):D966-74. https:\/\/doi.org\/10.1093\/nar\/gkt1026 . Epub 2013 Nov 11. (PMID:24217912)","DOI":"10.1093\/nar\/gkt1026"},{"key":"181_CR62","doi-asserted-by":"crossref","first-page":"231","DOI":"10.1162\/tacl_a_00179","volume":"2","author":"A Moro","year":"2014","unstructured":"Moro A, Raganato A, Navigli R. Entity linking meets word sense disambiguation: a unified approach. Transactions of the Association for Computational Linguistics. 2014;2:231\u201344.","journal-title":"Transactions of the Association for Computational Linguistics"},{"key":"181_CR63","first-page":"238","volume-title":"ACL (1)","author":"M Baroni","year":"2014","unstructured":"Baroni M, Dinu G, Kruszewski G. Don't count, predict! A systematic comparison of context-counting vs. context-predicting semantic vectors. In: ACL (1); 2014. p. 238\u201347."},{"key":"181_CR64","unstructured":"MEDLINE\/PubMed, https:\/\/www.nlm.nih.gov\/bsd\/pmresources.html . Accessed 2 Aug 2017."},{"issue":"2","key":"181_CR65","doi-asserted-by":"publisher","first-page":"119","DOI":"10.1038\/nrg1768","volume":"7","author":"LJ Jensen","year":"2006","unstructured":"Jensen LJ, Saric J, Bork P. Literature mining for the biologist: from information retrieval to biological discovery. Nat Rev Genet. 2006;7(2):119.","journal-title":"Nat Rev Genet"},{"key":"181_CR66","unstructured":"UniProt AC versus ID, http:\/\/www.uniprot.org\/help\/difference_accession_entryname . Accessed 2 Aug 2017."},{"key":"181_CR67","unstructured":"UniProtKB AC P08107, http:\/\/www.uniprot.org\/uniprot\/P08107 . Accessed 2 Aug 2017."},{"issue":"suppl 1","key":"181_CR68","doi-asserted-by":"publisher","first-page":"D140","DOI":"10.1093\/nar\/gkj112","volume":"34","author":"S Griffiths-Jones","year":"2006","unstructured":"Griffiths-Jones S, Grocock RJ, Van Dongen S, Bateman A, Enright AJ. miRBase: microRNA sequences, targets and gene nomenclature. Nucleic Acids Res. 2006;34(suppl 1):D140\u20134.","journal-title":"Nucleic Acids Res"},{"issue":"suppl 1","key":"181_CR69","doi-asserted-by":"publisher","first-page":"D521","DOI":"10.1093\/nar\/gkl923","volume":"35","author":"DS Wishart","year":"2007","unstructured":"Wishart DS, Tzur D, Knox C, Eisner R, Guo AC, Young N, Cheng D, Jewell K, Arndt D, Sawhney S, Fung C. HMDB: the human metabolome database. Nucleic Acids Res. 2007;35(suppl 1):D521\u20136.","journal-title":"Nucleic Acids Res"},{"key":"181_CR70","unstructured":"OBI, http:\/\/www.obofoundry.org\/ontology\/obi.html . Accessed 2 Aug 2017."},{"key":"181_CR71","unstructured":"PRO, http:\/\/www.obofoundry.org\/ontology\/pr.html . Accessed 2 Aug 2017."},{"key":"181_CR72","unstructured":"SO, http:\/\/www.obofoundry.org\/ontology\/so.html . Accessed 2 Aug 2017."},{"key":"181_CR73","unstructured":"GO, http:\/\/www.obofoundry.org\/ontology\/go.html . Accessed 2 Aug 2017."},{"key":"181_CR74","unstructured":"ChEBI, http:\/\/www.obofoundry.org\/ontology\/chebi.html . Accessed 2 Aug 2017."},{"key":"181_CR75","unstructured":"CL, http:\/\/www.obofoundry.org\/ontology\/cl.html . Accessed 2 Aug 2017."},{"key":"181_CR76","unstructured":"UBERON, http:\/\/www.obofoundry.org\/ontology\/uberon.html . Accessed 2 Aug 2017."},{"key":"181_CR77","unstructured":"PATO, http:\/\/www.obofoundry.org\/ontology\/pato.html . Accessed 2 Aug 2017."},{"key":"181_CR78","unstructured":"RO, http:\/\/www.obofoundry.org\/ontology\/ro.html . Accessed 2 Aug 2017."},{"key":"181_CR79","unstructured":"UniProtKB donwloable files, http:\/\/www.uniprot.org\/downloads . Accessed 2 Aug 2017."},{"key":"181_CR80","doi-asserted-by":"crossref","unstructured":"Arguello Casteleiro M, Klein J, Stevens R. The Proteasix ontology. Journal of biomedical semantics. 2016;7(1)","DOI":"10.1186\/s13326-016-0078-9"},{"key":"181_CR81","unstructured":"Horridge M, Drummond N, Goodwin J, Rector AL, Stevens R, Wang H. The Manchester OWL syntax. In OWLed. 2006;216"},{"key":"181_CR82","unstructured":"Harris S, Seaborne A, Prud\u2019hommeaux E. SPARQL 1.1 query language. W3C Recommendation. 2013;21:10. Available online at https:\/\/www.w3.org\/TR\/sparql11-query\/ ."},{"key":"181_CR83","volume-title":"SKOS simple knowledge organi-zation system reference. W3C recommendation, 18, W3C","author":"A Miles","year":"2009","unstructured":"Miles, A. and Bechhofer, S.: SKOS simple knowledge organi-zation system reference. W3C recommendation, 18, W3C 2009."},{"key":"181_CR84","unstructured":"MEDLINE\u00ae\/PubMed\u00ae XML Data Elements, https:\/\/www.nlm.nih.gov\/bsd\/licensee\/data_elements_doc.html . Accessed 2 Aug 2017."},{"key":"181_CR85","volume-title":"Beautiful soup-HTML. XML parser for Python","author":"L Richardson","year":"2008","unstructured":"Richardson L. Beautiful soup-HTML. XML parser for Python. 2008."},{"key":"181_CR86","unstructured":"Bird S, Klein E, Loper E. Natural language processing with python: analyzing text with the natural language toolkit. O'Reilly Media, Inc.; 2009. ISBN: 0596516495 9780596516499."},{"issue":"1","key":"181_CR87","doi-asserted-by":"publisher","first-page":"S3","DOI":"10.1186\/1471-2105-6-S1-S3","volume":"6","author":"L Tanabe","year":"2005","unstructured":"Tanabe L, Xie N, Thom LH, Matten W, Wilbur WJ. GENETAG: a tagged corpus for gene\/protein named entity recognition. BMC bioinformatics. 2005;6(1):S3.","journal-title":"BMC bioinformatics"},{"key":"181_CR88","unstructured":"word2vec, http:\/\/code.google.com\/p\/word2vec\/ . Accessed 2 Aug 2017."},{"key":"181_CR89","unstructured":"PubMed 14M dataset: list of PubMed IDs, http:\/\/pole-dl.cs.manchester.ac.uk\/experiments.html . Accessed 2 Aug 2017."},{"key":"181_CR90","unstructured":"Novak, Joseph D. and Ca\u00f1as, Alberto J. The theory underlying concept maps and how to construct and use them. Technical Report. Institute for Human and Machine Cognition, Pensacola. 2008 Available at: http:\/\/cmap.ihmc.us\/publications\/researchpapers\/theorycmaps\/theoryunderlyingconceptmaps.bck-11-01-06.htm . Accessed 2 Aug 2017."},{"key":"181_CR91","volume-title":"Proc. of computational linguistics (p. 604). Association for Computational Linguistics","author":"G Nenadic","year":"2004","unstructured":"Nenadic G, Ananiadou S, McNaught J. Enhancing automatic term recognition through recognition of variation. In: Proc. of computational linguistics (p. 604). Association for Computational Linguistics; 2004."},{"issue":"4","key":"181_CR92","doi-asserted-by":"publisher","first-page":"597","DOI":"10.1162\/coli.08-003-R1-07-044","volume":"34","author":"T Cohn","year":"2008","unstructured":"Cohn T, Callison-Burch C, Lapata M. Constructing corpora for the development and evaluation of paraphrase systems. Computational Linguistics. 2008;34(4):597\u2013614.","journal-title":"Computational Linguistics"},{"issue":"1","key":"181_CR93","doi-asserted-by":"publisher","first-page":"349","DOI":"10.1186\/1471-2105-10-349","volume":"10","author":"P Thompson","year":"2009","unstructured":"Thompson P, Iqbal SA, McNaught J, Ananiadou S. Construction of an annotated corpus to support biomedical information extraction. BMC bioinformatics. 2009;10(1):349.","journal-title":"BMC bioinformatics"},{"key":"181_CR94","doi-asserted-by":"publisher","first-page":"37","DOI":"10.1177\/001316446002000104","volume":"20","author":"JA Cohen","year":"1960","unstructured":"Cohen JA. Coefficient of agreement for nominal scales. Educ Psychol Meas. 1960;20:37\u201346.","journal-title":"Educ Psychol Meas"},{"issue":"5","key":"181_CR95","doi-asserted-by":"publisher","first-page":"378","DOI":"10.1037\/h0031619","volume":"76","author":"JL Fleiss","year":"1971","unstructured":"Fleiss JL. Measuring nominal scale agreement among many raters. Psychol Bull. 1971;76(5):378.","journal-title":"Psychol Bull"},{"issue":"4","key":"181_CR96","doi-asserted-by":"publisher","first-page":"555","DOI":"10.1162\/coli.07-034-R2","volume":"34","author":"R Artstein","year":"2008","unstructured":"Artstein R, Poesio M. Inter-coder agreement for computational linguistics. Computationa0l Linguistics. 2008;34(4):555\u201396.","journal-title":"Computationa0l Linguistics"},{"key":"181_CR97","doi-asserted-by":"crossref","unstructured":"Scott WA. Reliability of content analysis: the case of nominal scale coding. Public opinion quarterly. 1955:321\u20135.","DOI":"10.1086\/266577"},{"key":"181_CR98","unstructured":"Krippendorff K. Content analysis: an introduction to its methodology. Thousand Oaks: Sage; 2004."},{"issue":"8","key":"181_CR99","doi-asserted-by":"publisher","first-page":"861","DOI":"10.1016\/j.patrec.2005.10.010","volume":"27","author":"T Fawcett","year":"2006","unstructured":"Fawcett T. An introduction to ROC analysis. Pattern Recogn Lett. 2006;27(8):861\u201374.","journal-title":"Pattern Recogn Lett"},{"issue":"7","key":"181_CR100","doi-asserted-by":"publisher","first-page":"1145","DOI":"10.1016\/S0031-3203(96)00142-2","volume":"30","author":"AP Bradley","year":"1997","unstructured":"Bradley AP. The use of the area under the ROC curve in the evaluation of machine learning algorithms. Pattern Recogn. 1997;30(7):1145\u201359.","journal-title":"Pattern Recogn"},{"issue":"1","key":"181_CR101","doi-asserted-by":"publisher","first-page":"29","DOI":"10.1148\/radiology.143.1.7063747","volume":"143","author":"JA Hanley","year":"1982","unstructured":"Hanley JA, McNeil BJ. The meaning and use of the area under a receiver operating characteristic (ROC) curve. Radiology. 1982;143(1):29\u201336.","journal-title":"Radiology"},{"issue":"2","key":"181_CR102","doi-asserted-by":"publisher","first-page":"171","DOI":"10.1023\/A:1010920819831","volume":"45","author":"DJ Hand","year":"2001","unstructured":"Hand DJ, Till RJ. A simple generalisation of the area under the ROC curve for multiple class classification problems. Mach Learn. 2001;45(2):171\u201386.","journal-title":"Mach Learn"},{"key":"181_CR103","unstructured":"Klf7 gene, https:\/\/www.ncbi.nlm.nih.gov\/gene?Db=gene&Cmd=DetailsSearch&Term=93691 . Accessed 2 Aug 2017."},{"issue":"1","key":"181_CR104","doi-asserted-by":"publisher","first-page":"S17","DOI":"10.1186\/1471-2105-6-S1-S17","volume":"6","author":"EB Camon","year":"2005","unstructured":"Camon EB, Barrell DG, Dimmer EC, Lee V, Magrane M, Maslen J, Binns D, Apweiler R. An evaluation of GO annotation retrieval for BioCreAtIvE and GOA. BMC bioinformatics. 2005;6(1):S17.","journal-title":"BMC bioinformatics"},{"issue":"12","key":"181_CR105","doi-asserted-by":"publisher","first-page":"571","DOI":"10.1016\/j.tibtech.2006.10.002","volume":"24","author":"S Ananiadou","year":"2006","unstructured":"Ananiadou S, Kell DB, Tsujii JI. Text mining and its potential applications in systems biology. Trends Biotechnol. 2006;24(12):571\u20139.","journal-title":"Trends Biotechnol"},{"issue":"4","key":"181_CR106","doi-asserted-by":"publisher","first-page":"292","DOI":"10.1111\/j.1553-2712.1999.tb00392.x","volume":"6","author":"CS Federiuk","year":"1999","unstructured":"Federiuk CS. The effect of abbreviations on MEDLINE searching. Acad Emerg Med. 1999;6(4):292\u20136. (1999)","journal-title":"Acad Emerg Med"},{"issue":"suppl 1","key":"181_CR107","first-page":"D289","volume":"33","author":"JD Wren","year":"2005","unstructured":"Wren JD, Chang JT, Pustejovsky J, Adar E, Garner HR, Altman RB. Biomedical term mapping databases. Nucleic Acids Res. 2005;33(suppl 1):D289\u201393.","journal-title":"Nucleic Acids Res"},{"key":"181_CR108","doi-asserted-by":"crossref","unstructured":"Do\u011fan, I.R., Kim, S., Chatr-aryamontri, A., Chang, C.S., Oughtred, R., Rust, J., Wilbur, W.J., Comeau, D.C., Dolinski, K. and Tyers, M., . The BioC-BioGRID corpus: full text articles annotated for curation of protein\u2013protein and genetic interactions. Database, 2017 2017(1), p.baw147.","DOI":"10.1093\/database\/baw147"},{"issue":"W1","key":"181_CR109","doi-asserted-by":"publisher","first-page":"W518","DOI":"10.1093\/nar\/gkt441","volume":"41","author":"CH Wei","year":"2013","unstructured":"Wei CH, Kao HY, Lu Z. PubTator: a web-based text mining tool for assisting biocuration. Nucleic Acids Res. 2013;41(W1):W518\u201322.","journal-title":"Nucleic Acids Res"},{"key":"181_CR110","doi-asserted-by":"crossref","unstructured":"Lee, S., Kim, D., Lee, K., Choi, J., Kim, S., Jeon, M., Lim, S., Choi, D., Kim, S., Tan, A.C. and Kang, J., . BEST: next-generation biomedical entity search tool for knowledge discovery from biomedical literature. PLoS One, 2016 11(10), p.e0164680.","DOI":"10.1371\/journal.pone.0164680"},{"key":"181_CR111","volume-title":"Proceedings of semantic web applications and tools for the life sciences (SWAT4LS 2016)","author":"M Arguello Casteleiro","year":"2016","unstructured":"Arguello Casteleiro M, Fernandez-Prieto MJ, Demetriou G, Maroto N, Read W, Maseda-Fernandez D, Des-Diz J, Nenadic G, Keane J, Stevens R. Ontology learning with deep learning: a case study on patient safety using PubMed. In: Proceedings of semantic web applications and tools for the life sciences (SWAT4LS 2016); 2016. Available at http:\/\/ceur-ws.org\/Vol-1795\/paper12.pdf ."},{"issue":"suppl 2","key":"181_CR112","doi-asserted-by":"publisher","first-page":"W170","DOI":"10.1093\/nar\/gkp440","volume":"37","author":"NF Noy","year":"2009","unstructured":"Noy NF, Shah NH, Whetzel PL, Dai B, Dorf M, Griffith N, Jonquet C, Rubin DL, Storey MA, Chute CG, Musen MA. BioPortal: ontologies and integrated data resources at the click of a mouse. Nucleic Acids Res. 2009;37(suppl 2):W170\u20133.","journal-title":"Nucleic Acids Res"}],"container-title":["Journal of Biomedical Semantics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13326-018-0181-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/s13326-018-0181-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13326-018-0181-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,7,3]],"date-time":"2025-07-03T16:14:25Z","timestamp":1751559265000},"score":1,"resource":{"primary":{"URL":"https:\/\/jbiomedsem.biomedcentral.com\/articles\/10.1186\/s13326-018-0181-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,4,12]]},"references-count":112,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2018,12]]}},"alternative-id":["181"],"URL":"https:\/\/doi.org\/10.1186\/s13326-018-0181-1","relation":{},"ISSN":["2041-1480"],"issn-type":[{"value":"2041-1480","type":"electronic"}],"subject":[],"published":{"date-parts":[[2018,4,12]]},"assertion":[{"value":"27 September 2017","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"6 March 2018","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"12 April 2018","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"The authors declare that they have no competing interests.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interest"}},{"value":"The human raters have consented to make their anonymised judgements publically available.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval and consent to participate"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}},{"value":"Springer Nature remains neutral with regard to jurisdictional claims in published maps and institutional affiliations.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Publisher\u2019s Note"}}],"article-number":"13"}}