{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,18]],"date-time":"2026-03-18T02:46:12Z","timestamp":1773801972627,"version":"3.50.1"},"update-to":[{"DOI":"10.1371\/journal.pcbi.1006390","type":"new_version","label":"New version","source":"publisher","updated":{"date-parts":[[2018,8,23]],"date-time":"2018-08-23T00:00:00Z","timestamp":1534982400000}}],"reference-count":48,"publisher":"Public Library of Science (PLoS)","issue":"8","license":[{"start":{"date-parts":[[2018,8,13]],"date-time":"2018-08-13T00:00:00Z","timestamp":1534118400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/publicdomain\/zero\/1.0\/"}],"funder":[{"DOI":"10.13039\/100000092","name":"U.S. National Library of Medicine","doi-asserted-by":"publisher","award":["Intramural Research Program"],"award-info":[{"award-number":["Intramural Research Program"]}],"id":[{"id":"10.13039\/100000092","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000002","name":"National Institutes of Health","doi-asserted-by":"publisher","award":["UniProt 5U41HG007822-02"],"award-info":[{"award-number":["UniProt 5U41HG007822-02"]}],"id":[{"id":"10.13039\/100000002","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000051","name":"National Human Genome Research Institute","doi-asserted-by":"publisher","award":["U41HG007823"],"award-info":[{"award-number":["U41HG007823"]}],"id":[{"id":"10.13039\/100000051","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100004410","name":"European Molecular Biology Organization","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100004410","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["www.ploscompbiol.org"],"crossmark-restriction":false},"short-container-title":["PLoS Comput Biol"],"DOI":"10.1371\/journal.pcbi.1006390","type":"journal-article","created":{"date-parts":[[2018,8,13]],"date-time":"2018-08-13T17:23:54Z","timestamp":1534181034000},"page":"e1006390","update-policy":"https:\/\/doi.org\/10.1371\/journal.pcbi.corrections_policy","source":"Crossref","is-referenced-by-count":36,"title":["Scaling up data curation using deep learning: An application to literature triage in genomic variation resources"],"prefix":"10.1371","volume":"14","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-2015-3939","authenticated-orcid":true,"given":"Kyubum","family":"Lee","sequence":"first","affiliation":[]},{"given":"Maria Livia","family":"Famiglietti","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0978-0309","authenticated-orcid":true,"given":"Aoife","family":"McMahon","sequence":"additional","affiliation":[]},{"given":"Chih-Hsuan","family":"Wei","sequence":"additional","affiliation":[]},{"given":"Jacqueline Ann Langdon","family":"MacArthur","sequence":"additional","affiliation":[]},{"given":"Sylvain","family":"Poux","sequence":"additional","affiliation":[]},{"given":"Lionel","family":"Breuza","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2148-9135","authenticated-orcid":true,"given":"Alan","family":"Bridge","sequence":"additional","affiliation":[]},{"given":"Fiona","family":"Cunningham","sequence":"additional","affiliation":[]},{"given":"Ioannis","family":"Xenarios","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9998-916X","authenticated-orcid":true,"given":"Zhiyong","family":"Lu","sequence":"additional","affiliation":[]}],"member":"340","published-online":{"date-parts":[[2018,8,13]]},"reference":[{"issue":"D1","key":"ref1","doi-asserted-by":"crossref","first-page":"D158","DOI":"10.1093\/nar\/gkw1099","article-title":"UniProt: the universal protein knowledgebase","volume":"45","author":"C The UniProt","year":"2017","journal-title":"Nucleic Acids Res"},{"issue":"8","key":"ref2","doi-asserted-by":"crossref","first-page":"927","DOI":"10.1002\/humu.22594","article-title":"Genetic variations and diseases in UniProtKB\/Swiss-Prot: the ins and outs of expert manual curation","volume":"35","author":"ML Famiglietti","year":"2014","journal-title":"Hum Mutat"},{"issue":"D1","key":"ref3","doi-asserted-by":"crossref","first-page":"D896","DOI":"10.1093\/nar\/gkw1133","article-title":"The new NHGRI-EBI Catalog of published genome-wide association studies (GWAS Catalog)","volume":"45","author":"J MacArthur","year":"2017","journal-title":"Nucleic Acids Res"},{"key":"ref4","article-title":"Curation accuracy of model organism databases","author":"IM Keseler","year":"2014","journal-title":"Database (Oxford)"},{"issue":"13","key":"ref5","doi-asserted-by":"crossref","first-page":"i41","DOI":"10.1093\/bioinformatics\/btm229","article-title":"Manual curation is not sufficient for annotation of genomic databases","volume":"23","author":"WA Baumgartner Jr","year":"2007","journal-title":"Bioinformatics"},{"issue":"7576","key":"ref6","doi-asserted-by":"crossref","first-page":"S16","DOI":"10.1038\/527S16a","article-title":"Perspective: Sustaining the big-data ecosystem","volume":"527","author":"PE Bourne","year":"2015","journal-title":"Nature"},{"key":"ref7","first-page":"bas040","article-title":"Text mining in the biocuration workflow: applications for literature curation at WormBase, dictyBase and TAIR","author":"K Van Auken","year":"2012","journal-title":"Database (Oxford)"},{"issue":"11","key":"ref8","doi-asserted-by":"crossref","first-page":"1433","DOI":"10.1093\/bioinformatics\/btt156","article-title":"tmVar: a text mining approach for extracting sequence variants in biomedical literature","volume":"29","author":"CH Wei","year":"2013","journal-title":"Bioinformatics"},{"key":"ref9","doi-asserted-by":"crossref","first-page":"bas005","DOI":"10.1093\/database\/bas005","article-title":"A hybrid human and machine resource curation pipeline for the Neuroscience Information Framework","volume":"2012","author":"AE Bandrowski","year":"2012","journal-title":"Database (Oxford)"},{"issue":"5","key":"ref10","doi-asserted-by":"crossref","first-page":"842","DOI":"10.1016\/j.jbi.2012.04.006","article-title":"A SNPshot of PubMed to associate genetic variants with drugs, diseases, and adverse reactions","volume":"45","author":"J Hakenberg","year":"2012","journal-title":"J Biomed Inform"},{"issue":"3","key":"ref11","doi-asserted-by":"crossref","first-page":"408","DOI":"10.1093\/bioinformatics\/btq667","article-title":"Toward an automatic method for extracting cancer- and other disease-related point mutations from the biomedical literature","volume":"27","author":"E Doughty","year":"2011","journal-title":"Bioinformatics"},{"key":"ref12","article-title":"Hybrid curation of gene-mutation relations combining automated extraction and crowdsourcing","author":"JD Burger","year":"2014","journal-title":"Database (Oxford)"},{"key":"ref13","article-title":"Mutation extraction tools can be combined for robust recognition of genetic variants in the literature","volume":"3","author":"AJ Yepes","year":"2014","journal-title":"F1000Research"},{"issue":"1","key":"ref14","doi-asserted-by":"crossref","first-page":"68","DOI":"10.1186\/s12911-016-0294-3","article-title":"Establishing a baseline for literature mining human genetic variants and their relationships to disease cohorts","volume":"16","author":"KM Verspoor","year":"2016","journal-title":"BMC medical informatics and decision making"},{"issue":"21","key":"ref15","doi-asserted-by":"crossref","first-page":"3454","DOI":"10.1093\/bioinformatics\/btx439","article-title":"On expert curation and scalability: UniProtKB\/Swiss-Prot as a case study","volume":"33","author":"S Poux","year":"2017","journal-title":"Bioinformatics"},{"key":"ref16","doi-asserted-by":"crossref","first-page":"bas020","DOI":"10.1093\/database\/bas020","article-title":"Text mining for the biocuration workflow","volume":"2012","author":"L Hirschman","year":"2012","journal-title":"Database (Oxford)"},{"key":"ref17","article-title":"Biocuration workflows and text mining: overview of the BioCreative 2012 Workshop Track II","author":"Z Lu","year":"2012","journal-title":"Database"},{"issue":"3","key":"ref18","doi-asserted-by":"crossref","first-page":"177","DOI":"10.1038\/nrc1299","article-title":"A census of human cancer genes","volume":"4","author":"PA Futreal","year":"2004","journal-title":"Nature Reviews Cancer"},{"key":"ref19","unstructured":"The GWAS Catalog\u2014Methods. Available from: <ext-link xmlns:xlink=\"http:\/\/www.w3.org\/1999\/xlink\" ext-link-type=\"uri\" xlink:href=\"https:\/\/www.ebi.ac.uk\/gwas\/docs\/methods\" xlink:type=\"simple\">https:\/\/www.ebi.ac.uk\/gwas\/docs\/methods<\/ext-link>."},{"issue":"12","key":"ref20","doi-asserted-by":"crossref","first-page":"e115892","DOI":"10.1371\/journal.pone.0115892","article-title":"Machine learning for biomedical literature triage","volume":"9","author":"H Almeida","year":"2014","journal-title":"PLoS One"},{"key":"ref21","article-title":"Curation of characterized glycoside hydrolases of fungal origin","author":"C Murphy","year":"2011","journal-title":"Database"},{"key":"ref22","doi-asserted-by":"crossref","DOI":"10.3115\/v1\/D14-1181","article-title":"Convolutional neural networks for sentence classification","author":"Y Kim","year":"2014"},{"key":"ref23","article-title":"A sensitivity analysis of (and practitioners&apos; guide to) convolutional neural networks for sentence classification","author":"Y Zhang","year":"2015"},{"issue":"22","key":"ref24","doi-asserted-by":"crossref","first-page":"3444","DOI":"10.1093\/bioinformatics\/btw486","article-title":"Drug drug interaction extraction from biomedical literature using syntax convolutional neural network","volume":"32","author":"Z Zhao","year":"2016","journal-title":"Bioinformatics"},{"key":"ref25","author":"R Johnson","year":"2017"},{"key":"ref26","author":"S Lai","year":"2015"},{"key":"ref27","article-title":"Classifying relations by ranking with convolutional neural networks","author":"CNd Santos","year":"2015"},{"issue":"1","key":"ref28","doi-asserted-by":"crossref","first-page":"21","DOI":"10.1186\/s12859-018-2029-1","article-title":"Deep learning of mutation-gene-drug relations from the literature","volume":"19","author":"K Lee","year":"2018","journal-title":"BMC Bioinformatics"},{"key":"ref29","doi-asserted-by":"crossref","unstructured":"Amato F, Boselli R, Cesarini M, Mercorio F, Mezzanzanica M, Moscato V, et al., editors. Challenge: Processing web texts for classifying job offers. Semantic Computing (ICSC), 2015 IEEE International Conference on; 2015: IEEE.","DOI":"10.1109\/ICOSC.2015.7050852"},{"issue":"Oct","key":"ref30","first-page":"2825","article-title":"Scikit-learn: Machine learning in Python","volume":"12","author":"F Pedregosa","year":"2011","journal-title":"Journal of machine learning research"},{"key":"ref31","article-title":"tmVar 2.0: Integrating genomic variant information from literature with dbSNP and ClinVar for precision medicine","author":"CH Wei","year":"2017","journal-title":"Bioinformatics"},{"key":"ref32","doi-asserted-by":"crossref","first-page":"W518","DOI":"10.1093\/nar\/gkt441","article-title":"PubTator: a web-based text mining tool for assisting biocuration","volume":"41","author":"CH Wei","year":"2013","journal-title":"Nucleic Acids Res"},{"issue":"3","key":"ref33","doi-asserted-by":"crossref","first-page":"209","DOI":"10.1007\/s10676-013-9321-6","article-title":"Bias in algorithmic filtering and personalization","volume":"15","author":"E Bozdag","year":"2013","journal-title":"Ethics and information technology"},{"key":"ref34","article-title":"Understanding intermediate layers using linear classifier probes","author":"G Alain","year":"2016"},{"key":"ref35","article-title":"Opening the black box of deep neural networks via information","author":"R Shwartz-Ziv","year":"2017"},{"key":"ref36","doi-asserted-by":"crossref","first-page":"bau016","DOI":"10.1093\/database\/bau016","article-title":"Expert curation in UniProtKB: a case study on dealing with conflicting and erroneous data","volume":"2014","author":"S Poux","year":"2014","journal-title":"Database (Oxford)"},{"key":"ref37","unstructured":"UniProtKB\/Swiss-Prot human data Download. Available from: <ext-link xmlns:xlink=\"http:\/\/www.w3.org\/1999\/xlink\" ext-link-type=\"uri\" xlink:href=\"http:\/\/ftp:\/\/ftp.uniprot.org\/pub\/databases\/uniprot\/current_release\/knowledgebase\/taxonomic_divisions\" xlink:type=\"simple\">ftp:\/\/ftp.uniprot.org\/pub\/databases\/uniprot\/current_release\/knowledgebase\/taxonomic_divisions<\/ext-link>."},{"key":"ref38","unstructured":"Information NCfB. Entrez Programming Utilities 2010. Available from: <ext-link xmlns:xlink=\"http:\/\/www.w3.org\/1999\/xlink\" ext-link-type=\"uri\" xlink:href=\"https:\/\/eutils.ncbi.nlm.nih.gov\/entrez\/eutils\/\" xlink:type=\"simple\">https:\/\/eutils.ncbi.nlm.nih.gov\/entrez\/eutils\/<\/ext-link>."},{"key":"ref39","unstructured":"LeCun Y, Bengio Y. Convolutional networks for images, speech, and time series."},{"key":"ref40","author":"D Ciregan","year":"2012"},{"issue":"1","key":"ref41","doi-asserted-by":"crossref","first-page":"98","DOI":"10.1109\/72.554195","article-title":"Face recognition: A convolutional neural-network approach","volume":"8","author":"S Lawrence","year":"1997","journal-title":"IEEE transactions on neural networks"},{"issue":"11","key":"ref42","doi-asserted-by":"crossref","first-page":"2278","DOI":"10.1109\/5.726791","article-title":"Gradient-based learning applied to document recognition","volume":"86","author":"Y LeCun","year":"1998","journal-title":"Proceedings of the IEEE"},{"issue":"Aug","key":"ref43","first-page":"2493","article-title":"Natural language processing (almost) from scratch","volume":"12","author":"R Collobert","year":"2011","journal-title":"Journal of Machine Learning Research"},{"key":"ref44","unstructured":"Chollet F. Keras 2015. Available from: <ext-link xmlns:xlink=\"http:\/\/www.w3.org\/1999\/xlink\" ext-link-type=\"uri\" xlink:href=\"https:\/\/keras.io\" xlink:type=\"simple\">https:\/\/keras.io<\/ext-link>."},{"key":"ref45","article-title":"Tensorflow: Large-scale machine learning on heterogeneous distributed systems","author":"M Abadi","year":"2016"},{"key":"ref46","first-page":"39","author":"S Pyysalo","year":"2013"},{"key":"ref47","author":"B Chiu","year":"2016"},{"key":"ref48","article-title":"Distributed representations of words and phrases and their compositionality","author":"T Mikolov","year":"2013","journal-title":"Advances in neural information processing systems"}],"updated-by":[{"DOI":"10.1371\/journal.pcbi.1006390","type":"new_version","label":"New version","source":"publisher","updated":{"date-parts":[[2018,8,23]],"date-time":"2018-08-23T00:00:00Z","timestamp":1534982400000}}],"container-title":["PLOS Computational Biology"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/dx.plos.org\/10.1371\/journal.pcbi.1006390","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,9,4]],"date-time":"2023-09-04T09:50:55Z","timestamp":1693821055000},"score":1,"resource":{"primary":{"URL":"https:\/\/dx.plos.org\/10.1371\/journal.pcbi.1006390"}},"subtitle":[],"editor":[{"given":"Rong","family":"Xu","sequence":"first","affiliation":[]}],"short-title":[],"issued":{"date-parts":[[2018,8,13]]},"references-count":48,"journal-issue":{"issue":"8","published-online":{"date-parts":[[2018,8,13]]}},"URL":"https:\/\/doi.org\/10.1371\/journal.pcbi.1006390","relation":{"new_version":[{"id-type":"doi","id":"10.1371\/journal.pcbi.1006390","asserted-by":"object"}]},"ISSN":["1553-7358"],"issn-type":[{"value":"1553-7358","type":"electronic"}],"subject":[],"published":{"date-parts":[[2018,8,13]]}}}