{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,8]],"date-time":"2025-10-08T15:50:03Z","timestamp":1759938603307},"reference-count":41,"publisher":"Public Library of Science (PLoS)","issue":"2","license":[{"start":{"date-parts":[[2007,2,23]],"date-time":"2007-02-23T00:00:00Z","timestamp":1172188800000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"content-domain":{"domain":["www.ploscompbiol.org"],"crossmark-restriction":false},"short-container-title":["PLoS Comput Biol"],"DOI":"10.1371\/journal.pcbi.0030020","type":"journal-article","created":{"date-parts":[[2007,2,20]],"date-time":"2007-02-20T18:40:16Z","timestamp":1171996816000},"page":"e20","update-policy":"http:\/\/dx.doi.org\/10.1371\/journal.pcbi.corrections_policy","source":"Crossref","is-referenced-by-count":53,"title":["Improving the Caenorhabditis elegans Genome Annotation Using Machine Learning"],"prefix":"10.1371","volume":"3","author":[{"given":"Gunnar","family":"R\u00e4tsch","sequence":"first","affiliation":[]},{"given":"S\u00f6ren","family":"Sonnenburg","sequence":"additional","affiliation":[]},{"given":"Jagan","family":"Srinivasan","sequence":"additional","affiliation":[]},{"given":"Hanh","family":"Witte","sequence":"additional","affiliation":[]},{"given":"Klaus-R","family":"M\u00fcller","sequence":"additional","affiliation":[]},{"given":"Ralf-J","family":"Sommer","sequence":"additional","affiliation":[]},{"given":"Bernhard","family":"Sch\u00f6lkopf","sequence":"additional","affiliation":[]}],"member":"340","published-online":{"date-parts":[[2007,2,23]]},"reference":[{"key":"pcbi-0030020-b001","doi-asserted-by":"crossref","first-page":"D411","DOI":"10.1093\/nar\/gkh066","article-title":"Wormbase: A multi-species resource for nematode biology and genomics.","volume":"32","year":"2004","journal-title":"Nucleic Acids Res"},{"key":"pcbi-0030020-b002","doi-asserted-by":"crossref","first-page":"2012","DOI":"10.1126\/science.282.5396.2012","article-title":"Genome sequence of the Nematode Caenorhabditis elegans. A platform for investigating biology.","volume":"282","author":"The Caenorhabditis elegans sequencing consortium","year":"1998","journal-title":"Science"},{"key":"pcbi-0030020-b003","doi-asserted-by":"crossref","first-page":"D475","DOI":"10.1093\/nar\/gkj061","article-title":"Wormbase: Better software, richer content.","volume":"34","year":"2006","journal-title":"Nucleic Acids Res"},{"key":"pcbi-0030020-b004","doi-asserted-by":"crossref","unstructured":"VapnikV 1995 The nature of statistical learning theory New York Springer Verlag","DOI":"10.1007\/978-1-4757-2440-0"},{"key":"pcbi-0030020-b005","unstructured":"Sch\u00f6lkopfBSmolaAJ 2002 Learning with kernels Cambridge (Massachusetts) MIT Press"},{"key":"pcbi-0030020-b006","doi-asserted-by":"crossref","first-page":"181","DOI":"10.1109\/72.914517","article-title":"An introduction to kernel-based learning algorithms.","volume":"12","year":"2001","journal-title":"IEEE Trans Neural Networks"},{"key":"pcbi-0030020-b007","doi-asserted-by":"crossref","first-page":"95","DOI":"10.1089\/10665270050081405","article-title":"A discriminative framework for detecting remote protein homologies.","volume":"7","year":"2000","journal-title":"J Comput Biol"},{"key":"pcbi-0030020-b008","doi-asserted-by":"crossref","first-page":"262","DOI":"10.1073\/pnas.97.1.262","article-title":"Knowledge-based analysis of microarray gene expression data by using support vector machines.","volume":"97","year":"2000","journal-title":"Proc Natl Acad Sci U S A"},{"key":"pcbi-0030020-b009","doi-asserted-by":"crossref","first-page":"799","DOI":"10.1093\/bioinformatics\/16.9.799","article-title":"Engineering support vector machine kernels that recognize translation initiation sites.","volume":"16","year":"2000","journal-title":"Bioinformatics"},{"key":"pcbi-0030020-b010","doi-asserted-by":"crossref","first-page":"2051","DOI":"10.1126\/science.293.5537.2051","article-title":"Machine learning for science: State of the art and future prospects.","volume":"293","year":"2001","journal-title":"Science"},{"key":"pcbi-0030020-b011","first-page":"329","article-title":"New methods for splice-site recognition.","volume":"2415","year":"2002","journal-title":"Proceedings of the International Conference on Artificial Neural Networks. Lect Notes Comp Sci"},{"key":"pcbi-0030020-b012","doi-asserted-by":"crossref","first-page":"2637","DOI":"10.1101\/gr.1679003","article-title":"Sequence information for the splicing of human pre-mRNA identified by support vector machine classification.","volume":"13","year":"2003","journal-title":"Genome Res"},{"key":"pcbi-0030020-b013","first-page":"134","article-title":"A generalized hidden Markov model for the recognition of human genes in DNA.","volume":"1996","year":"1996","journal-title":"ISMB"},{"key":"pcbi-0030020-b014","doi-asserted-by":"crossref","first-page":"78","DOI":"10.1006\/jmbi.1997.0951","article-title":"Prediction of complete gene structures in human genomic DNA.","volume":"268","year":"1997","journal-title":"J Mol Biol"},{"key":"pcbi-0030020-b015","unstructured":"KroghA 1997 Two methods for improving performance of a HMM and their application for gene finding. Proceedings of the Fifth International Conference on Intelligent Systems for Molecular Biology 21\u201326 June, 1997; Halkidiki, Greece. AAAI Press 179 186 Available: http:\/\/www.aaai.org\/Library\/ISMB\/ismb97contents.php. Accessed 24 January 2007."},{"key":"pcbi-0030020-b016","first-page":"1107","article-title":"Genemark.hmm: New solutions for gene finding.","volume":"25","year":"1998","journal-title":"Nucleic Acids Res"},{"key":"pcbi-0030020-b017","doi-asserted-by":"crossref","first-page":"299","DOI":"10.1002\/9780470110607.ch13","article-title":"AceDB: A database for genome information.","volume":"39","year":"1998","journal-title":"Methods Biochem Anal"},{"key":"pcbi-0030020-b018","doi-asserted-by":"crossref","first-page":"529","DOI":"10.1101\/gr.10.4.529","article-title":"Genie\u2013Gene finding in Drosophila melanogaster.","volume":"10","year":"2000","journal-title":"Genome Res"},{"key":"pcbi-0030020-b019","unstructured":"AltunYTsochantaridisIHofmannT 2003 Hidden Markov support vector machines. Proceedings of the 20th International Conference on Machine Learning 21\u201324 August 2003, Washington, D. C. 3 10"},{"key":"pcbi-0030020-b020","doi-asserted-by":"crossref","first-page":"59","DOI":"10.1186\/1471-2105-5-59","article-title":"Gene finding in novel genomes.","volume":"5","year":"2004","journal-title":"BMC Bioinformatics"},{"key":"pcbi-0030020-b021","doi-asserted-by":"crossref","first-page":"i57","DOI":"10.1093\/bioinformatics\/bti1040","article-title":"ExonHunter: A comprehensive approach to gene finding.","volume":"21","year":"2005","journal-title":"Bioinformatics"},{"key":"pcbi-0030020-b022","doi-asserted-by":"crossref","first-page":"35","DOI":"10.1038\/ng1140","article-title":"C. elegans ORFeome version 1.1: Experimental verification of the genome annotation and resource for proteome-scale protein expression.","volume":"34","year":"2003","journal-title":"Nat Genet"},{"key":"pcbi-0030020-b023","doi-asserted-by":"crossref","first-page":"656","DOI":"10.1101\/gr.229202","article-title":"Blat\u2014The blast-like alignment tool.","volume":"12","year":"2002","journal-title":"Genome Res"},{"key":"pcbi-0030020-b024","unstructured":"DavisJGoadrichM 2006 The relationship between precision-recall and roc curves. Technical report #1551 Madison (Wisconsin) University of Wisconsin Madison"},{"key":"pcbi-0030020-b025","doi-asserted-by":"crossref","first-page":"S9","DOI":"10.1186\/1471-2105-7-S1-S9","article-title":"Learning interpretable SVMs for biological sequence classification.","volume":"7","year":"2006","journal-title":"BMC Bioinformatics"},{"key":"pcbi-0030020-b026","doi-asserted-by":"crossref","unstructured":"SonnenburgSR\u00e4tschGRieckK 2007 Large-scale learning with string kernels. In: BottouLChapelleODeCosteDWestonJ Large-scale kernel machines Cambridge (Massachusetts) MIT Press 73 104 In press.","DOI":"10.7551\/mitpress\/7496.003.0006"},{"key":"pcbi-0030020-b027","doi-asserted-by":"crossref","first-page":"769","DOI":"10.1016\/j.molcel.2006.05.008","article-title":"Comparative analysis identifies exonic splicing regulatory sequences\u2014The complex definition of enhancers and silencers.","volume":"22","year":"2006","journal-title":"Mol Cell"},{"key":"pcbi-0030020-b028","first-page":"2","article-title":"The genome sequence of Caenorhabditis briggsae: A platform for comparative genomics.","volume":"1","year":"2003","journal-title":"PLoS Biol"},{"issue":"Database issue","key":"pcbi-0030020-b029","first-page":"D506","article-title":"Wormbase: New content and better access.","volume":"35","year":"2006","journal-title":"Nucleic Acids Res"},{"key":"pcbi-0030020-b030","doi-asserted-by":"crossref","first-page":"2553","DOI":"10.1093\/nar\/gkg359","article-title":"Limited microsynteny between the genomes of Pristionchus pacificus and Caenorhabditis elegans.","volume":"31","year":"2003","journal-title":"Nucleic Acids Res"},{"key":"pcbi-0030020-b031","doi-asserted-by":"crossref","first-page":"1333","DOI":"10.1073\/pnas.76.3.1333","article-title":"Analysis of the constancy of DNA sequences during development and evolution of the nematode Caenorhabditis elegans.","volume":"76","year":"1979","journal-title":"Proc Natl Acad Sci U S A"},{"key":"pcbi-0030020-b032","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1006\/jmbi.1995.0198","article-title":"Identification of protein coding regions in genomic DNA.","volume":"248","year":"1995","journal-title":"J Mol Biol"},{"key":"pcbi-0030020-b033","doi-asserted-by":"crossref","first-page":"141","DOI":"10.1016\/0022-2836(92)90130-C","article-title":"Prediction of gene structure.","volume":"226","year":"1992","journal-title":"J Mol Biol"},{"key":"pcbi-0030020-b034","doi-asserted-by":"crossref","first-page":"9061","DOI":"10.1073\/pnas.93.17.9061","article-title":"Gene recognition via spliced sequence alignment.","volume":"93","year":"1996","journal-title":"Proc Natl Acad Sci U S A"},{"key":"pcbi-0030020-b035","doi-asserted-by":"crossref","first-page":"777","DOI":"10.1093\/bioinformatics\/18.6.777","article-title":"Exon discovery by genomic sequence alignment.","volume":"18","year":"2002","journal-title":"Bioinformatics"},{"key":"pcbi-0030020-b036","doi-asserted-by":"crossref","first-page":"307","DOI":"10.1016\/j.jmb.2004.01.026","article-title":"Identification of new human cadherin genes using a combination of protein motif search and gene finding methods.","volume":"337","year":"2004","journal-title":"J Mol Biol"},{"key":"pcbi-0030020-b037","doi-asserted-by":"crossref","first-page":"332","DOI":"10.1038\/ng0893-332","article-title":"dbEST\u2014Database for \u201cexpressed sequence tags.\u201d.","volume":"4","year":"1993","journal-title":"Nat Genet"},{"key":"pcbi-0030020-b038","first-page":"1531","article-title":"Large scale multiple kernel learning.","volume":"7","year":"2006","journal-title":"J Mach Learn Res"},{"key":"pcbi-0030020-b039","unstructured":"CPLEX Optimization 1994 Using the CPLEX Callable Library Incline Village (Nevada) CPLEX Optimization"},{"key":"pcbi-0030020-b040","doi-asserted-by":"crossref","first-page":"215","DOI":"10.1016\/j.scico.2003.12.005","article-title":"A discipline of dynamic programming over sequence data.","volume":"51","year":"2004","journal-title":"Sci Comput Program"},{"key":"pcbi-0030020-b041","doi-asserted-by":"crossref","unstructured":"RozenSSkaletskyH 2000 Primer3 on the WWW for general users and for biologist programmers. In: MisenerSKrawetzS Bioinformatics methods and protocols: Methods in molecular biology Totowa (New Jersey) Humana Press 365 386","DOI":"10.1385\/1-59259-192-2:365"}],"container-title":["PLoS Computational Biology"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/dx.plos.org\/10.1371\/journal.pcbi.0030020","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,2,11]],"date-time":"2024-02-11T03:06:15Z","timestamp":1707620775000},"score":1,"resource":{"primary":{"URL":"https:\/\/dx.plos.org\/10.1371\/journal.pcbi.0030020"}},"subtitle":[],"editor":[{"given":"Uwe","family":"Ohler","sequence":"first","affiliation":[]}],"short-title":[],"issued":{"date-parts":[[2007,2,23]]},"references-count":41,"journal-issue":{"issue":"2","published-online":{"date-parts":[[2007,2,23]]}},"URL":"https:\/\/doi.org\/10.1371\/journal.pcbi.0030020","relation":{},"ISSN":["1553-7358"],"issn-type":[{"value":"1553-7358","type":"electronic"}],"subject":[],"published":{"date-parts":[[2007,2,23]]}}}