{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,6]],"date-time":"2026-04-06T22:05:11Z","timestamp":1775513111042,"version":"3.50.1"},"reference-count":51,"publisher":"Springer Science and Business Media LLC","issue":"1","funder":[{"DOI":"10.13039\/501100001659","name":"Deutsche Forschungsgemeinschaft","doi-asserted-by":"crossref","id":[{"id":"10.13039\/501100001659","id-type":"DOI","asserted-by":"crossref"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["BMC Bioinformatics"],"published-print":{"date-parts":[[2017,12]]},"DOI":"10.1186\/s12859-017-1884-5","type":"journal-article","created":{"date-parts":[[2017,11,9]],"date-time":"2017-11-09T02:10:18Z","timestamp":1510193418000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":46,"title":["Sequence-based information-theoretic features for gene essentiality prediction"],"prefix":"10.1186","volume":"18","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-8796-136X","authenticated-orcid":false,"given":"Dawit","family":"Nigatu","sequence":"first","affiliation":[]},{"given":"Patrick","family":"Sobetzko","sequence":"additional","affiliation":[]},{"given":"Malik","family":"Yousef","sequence":"additional","affiliation":[]},{"given":"Werner","family":"Henkel","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2017,11,9]]},"reference":[{"issue":"1","key":"1884_CR1","doi-asserted-by":"crossref","first-page":"99","DOI":"10.1146\/annurev.genom.1.1.99","volume":"1","author":"EV Koonin","year":"2000","unstructured":"Koonin EV. How many genes can make a cell: The minimal-gene-set concept 1. Annu Rev Genomics Hum Genet. 2000; 1(1):99\u2013116.","journal-title":"Annu Rev Genomics Hum Genet"},{"issue":"3","key":"1884_CR2","doi-asserted-by":"crossref","first-page":"257","DOI":"10.1016\/0014-5793(95)00233-Y","volume":"362","author":"M Itaya","year":"1995","unstructured":"Itaya M. An estimation of minimal genome size required for life. FEBS Lett. 1995; 362(3):257\u201360.","journal-title":"FEBS Lett"},{"issue":"1","key":"1884_CR3","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1016\/S0163-7258(02)00222-X","volume":"95","author":"AF Chalker","year":"2002","unstructured":"Chalker AF, Lunsford RD. Rational identification of new antibacterial drug targets that are essential for viability using a genomics-based approach. Pharmacol Ther. 2002; 95(1):1\u201320.","journal-title":"Pharmacol Ther"},{"issue":"12","key":"1884_CR4","doi-asserted-by":"crossref","first-page":"7213","DOI":"10.1073\/pnas.1231432100","volume":"100","author":"G Lamichhane","year":"2003","unstructured":"Lamichhane G, Zignol M, Blades NJ, Geiman DE, Dougherty A, Grosset J, Broman KW, Bishai WR. A postgenomic method for predicting essential genes at subsaturation levels of mutagenesis: application to mycobacterium tuberculosis. Proc Natl Acad Sci. 2003; 100(12):7213\u20138.","journal-title":"Proc Natl Acad Sci"},{"issue":"6280","key":"1884_CR5","doi-asserted-by":"crossref","first-page":"6253","DOI":"10.1126\/science.aad6253","volume":"351","author":"CA Hutchison","year":"2016","unstructured":"Hutchison CA, Chuang RY, Noskov VN, Assad-Garcia N, Deerinck TJ, Ellisman MH, Gill J, Kannan K, Karas BJ, Ma L, et al. Design and synthesis of a minimal bacterial genome. Science. 2016; 351(6280):6253.","journal-title":"Science"},{"issue":"23","key":"1884_CR6","doi-asserted-by":"crossref","first-page":"7926","DOI":"10.1128\/JB.186.23.7926-7935.2004","volume":"186","author":"NR Salama","year":"2004","unstructured":"Salama NR, Shepherd B, Falkow S. Global transposon mutagenesis and essential gene analysis of helicobacter pylori. J Bacteriol. 2004; 186(23):7926\u201335.","journal-title":"J Bacteriol"},{"key":"1884_CR7","doi-asserted-by":"crossref","unstructured":"Chen L, Ge X, Xu P. Identifying essential Streptococcus sanguinis genes using genome-wide deletion mutation. Methods Mol Biol; 1279:15\u201323.","DOI":"10.1007\/978-1-4939-2398-4_2"},{"issue":"6896","key":"1884_CR8","doi-asserted-by":"crossref","first-page":"387","DOI":"10.1038\/nature00935","volume":"418","author":"G Giaever","year":"2002","unstructured":"Giaever G, Chu AM, Ni L, Connelly C, Riles L, Veronneau S, Dow S, Lucau-Danila A, Anderson K, Andre B, et al. Functional profiling of the saccharomyces cerevisiae genome. Nature. 2002; 418(6896):387\u201391.","journal-title":"Nature"},{"issue":"3","key":"1884_CR9","doi-asserted-by":"crossref","first-page":"217","DOI":"10.1111\/j.1440-1711.2005.01332.x","volume":"83","author":"LM Cullen","year":"2005","unstructured":"Cullen LM, Arndt GM. Genome-wide screening for gene function using RNAi in mammalian cells. Immunol Cell Biol. 2005; 83(3):217\u201323.","journal-title":"Immunol Cell Biol"},{"issue":"10","key":"1884_CR10","doi-asserted-by":"crossref","first-page":"433","DOI":"10.1016\/j.tim.2009.08.005","volume":"17","author":"MA D\u2019Elia","year":"2009","unstructured":"D\u2019Elia MA, Pereira MP, Brown ED. Are essential genes really essential?Trends Microbiol. 2009; 17(10):433\u20138.","journal-title":"Trends Microbiol"},{"issue":"19","key":"1884_CR11","doi-asserted-by":"crossref","first-page":"10268","DOI":"10.1073\/pnas.93.19.10268","volume":"93","author":"AR Mushegian","year":"1996","unstructured":"Mushegian AR, Koonin EV. A minimal gene set for cellular life derived by comparison of complete bacterial genomes. Proc Natl Acad Sci. 1996; 93(19):10268\u201373.","journal-title":"Proc Natl Acad Sci"},{"key":"1884_CR12","first-page":"75","volume":"7","author":"X Zhang","year":"2016","unstructured":"Zhang X, Acencio ML, Lemke N. Predicting essential genes and proteins based on machine learning and network topological features: A comprehensive review. Front Physiol. 2016; 7:75. doi: 10.3389\/fphys.2016.00075 .","journal-title":"Front Physiol"},{"issue":"D1","key":"1884_CR13","doi-asserted-by":"crossref","first-page":"574","DOI":"10.1093\/nar\/gkt1131","volume":"42","author":"H Luo","year":"2014","unstructured":"Luo H, Lin Y, Gao F, Zhang CT, Zhang R. Deg 10, an update of the database of essential genes that includes both protein-coding genes and noncoding genomic elements. Nucleic Acids Res. 2014; 42(D1):574\u201380.","journal-title":"Nucleic Acids Res"},{"issue":"1","key":"1884_CR14","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1186\/1471-2164-14-1","volume":"14","author":"YN Ye","year":"2013","unstructured":"Ye YN, Hua ZG, Huang J, Rao N, Guo FB. CEG: a database of essential gene clusters. BMC Genomics. 2013; 14(1):1.","journal-title":"BMC Genomics"},{"issue":"D1","key":"1884_CR15","doi-asserted-by":"crossref","first-page":"901","DOI":"10.1093\/nar\/gkr986","volume":"40","author":"WH Chen","year":"2012","unstructured":"Chen WH, Minguez P, Lercher MJ, Bork P. OGEE: an online gene essentiality database. Nucleic Acids Res. 2012; 40(D1):901\u20136.","journal-title":"Nucleic Acids Res"},{"key":"1884_CR16","doi-asserted-by":"crossref","first-page":"4564","DOI":"10.4238\/2014.June.17.8","volume":"13","author":"L Ning","year":"2014","unstructured":"Ning L, Lin H, Ding H, Huang J, Rao N, Guo F. Predicting bacterial essential genes using only sequence composition information. Genet Mol Res. 2014; 13:4564\u201372.","journal-title":"Genet Mol Res"},{"issue":"4","key":"1884_CR17","doi-asserted-by":"crossref","first-page":"460","DOI":"10.1039\/C3IB40241J","volume":"6","author":"K Song","year":"2014","unstructured":"Song K, Tong T, Wu F. Predicting essential genes in prokaryotic genomes using a linear method: Zupls. Integr Biol. 2014; 6(4):460\u20139.","journal-title":"Integr Biol"},{"issue":"3","key":"1884_CR18","doi-asserted-by":"crossref","first-page":"577","DOI":"10.1039\/C6MB00806B","volume":"13","author":"Y Yu","year":"2017","unstructured":"Yu Y, Yang L, Liu Z, Zhu C. Gene essentiality prediction based on fractal features and machine learning. Mol BioSyst. 2017; 13(3):577\u201384.","journal-title":"Mol BioSyst"},{"issue":"1","key":"1884_CR19","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1186\/1752-0509-4-56","volume":"4","author":"K Plaimas","year":"2010","unstructured":"Plaimas K, Eils R, K\u00f6nig R. Identifying essential genes in bacterial metabolic networks with machine learning methods. BMC Syst Biol. 2010; 4(1):1.","journal-title":"BMC Syst Biol"},{"issue":"1","key":"1884_CR20","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1186\/1471-2105-10-290","volume":"10","author":"ML Acencio","year":"2009","unstructured":"Acencio ML, Lemke N. Towards the prediction of essential genes by integration of network topology, cellular localization and biological process information. BMC Bioinformatics. 2009; 10(1):1.","journal-title":"BMC Bioinformatics"},{"key":"1884_CR21","doi-asserted-by":"crossref","first-page":"29","DOI":"10.1016\/j.compbiolchem.2014.01.011","volume":"50","author":"Y Lu","year":"2014","unstructured":"Lu Y, Deng J, Rhodes JC, Lu H, Lu LJ. Predicting essential genes for identifying potential drug targets in aspergillus fumigatus. Comput Biol Chem. 2014; 50:29\u201340.","journal-title":"Comput Biol Chem"},{"issue":"1","key":"1884_CR22","doi-asserted-by":"crossref","first-page":"86805","DOI":"10.1371\/journal.pone.0086805","volume":"9","author":"J Cheng","year":"2014","unstructured":"Cheng J, Xu Z, Wu W, Zhao L, Li X, Liu Y, Tao S. Training set selection for the prediction of essential genes. PloS ONE. 2014; 9(1):86805.","journal-title":"PloS ONE"},{"issue":"8","key":"1884_CR23","doi-asserted-by":"crossref","first-page":"72343","DOI":"10.1371\/journal.pone.0072343","volume":"8","author":"W Wei","year":"2013","unstructured":"Wei W, Ning LW, Ye YN, Guo FB. Geptop: a gene essentiality prediction tool for sequenced bacterial genomes based on orthology and phylogeny. PloS ONE. 2013; 8(8):72343.","journal-title":"PloS ONE"},{"issue":"1","key":"1884_CR24","doi-asserted-by":"crossref","first-page":"910","DOI":"10.1186\/1471-2164-14-910","volume":"14","author":"J Cheng","year":"2013","unstructured":"Cheng J, Wu W, Zhang Y, Li X, Jiang X, Wei G, Tao S. A new computational strategy for predicting essential genes. BMC Genomics. 2013; 14(1):910.","journal-title":"BMC Genomics"},{"issue":"3","key":"1884_CR25","doi-asserted-by":"crossref","first-page":"795","DOI":"10.1093\/nar\/gkq784","volume":"39","author":"J Deng","year":"2011","unstructured":"Deng J, Deng L, Su S, Zhang M, Lin X, Wei L, Minai AA, Hassett DJ, Lu LJ. Investigating the predictability of essential genes across distantly related organisms using an integrative approach. Nucleic Acids Res. 2011; 39(3):795\u2013807.","journal-title":"Nucleic Acids Res"},{"key":"1884_CR26","volume-title":"2011 10th International Conference on Machine Learning and Applications and Workshops","author":"K Palaniappan","year":"2011","unstructured":"Palaniappan K, Mukherjee S. Predicting \u201cessential\u201d genes across microbial genomes: a machine learning approach. In: 2011 10th International Conference on Machine Learning and Applications and Workshops. Honolulu: IEEE: 2011. p. 189\u201394. doi: 10.1109\/ICMLA.2011.114 ."},{"issue":"3","key":"1884_CR27","first-page":"0174638","volume":"12","author":"X Liu","year":"2017","unstructured":"Liu X, Wang BJ, Xu L, Tang HL, Xu GQ. Selection of key sequence-based features for prediction of essential genes in 31 diverse bacterial species. PloS ONE. 2017; 12(3):0174638.","journal-title":"PloS ONE"},{"key":"1884_CR28","doi-asserted-by":"crossref","first-page":"84","DOI":"10.1016\/j.jtbi.2017.01.031","volume":"418","author":"Y Li","year":"2017","unstructured":"Li Y, Lv Y, Li X, Xiao W, Li C. Sequence comparison and essential gene identification with new inter-nucleotide distance sequences. J Theor Biol. 2017; 418:84\u201393.","journal-title":"J Theor Biol"},{"issue":"12","key":"1884_CR29","doi-asserted-by":"crossref","first-page":"1758","DOI":"10.1093\/bioinformatics\/btx055","volume":"33","author":"FB Guo","year":"2017","unstructured":"Guo FB, Dong C, Hua HL, Liu S, Luo H, Zhang HW, Jin YT, Zhang KY. Accurate prediction of human essential genes using only nucleotide composition and association information. Bioinformatics. 2017; 33(12):1758\u201364.","journal-title":"Bioinformatics"},{"issue":"3","key":"1884_CR30","doi-asserted-by":"crossref","first-page":"1281","DOI":"10.1093\/nar\/15.3.1281","volume":"15","author":"PM Sharp","year":"1987","unstructured":"Sharp PM, Li WH. The codon adaptation index-a measure of directional synonymous codon usage bias, and its potential applications. Nucleic Acids Res. 1987; 15(3):1281\u201395.","journal-title":"Nucleic Acids Res"},{"issue":"suppl_2","key":"1884_CR31","doi-asserted-by":"crossref","first-page":"174","DOI":"10.1093\/nar\/gkp278","volume":"37","author":"Z Xu","year":"2009","unstructured":"Xu Z, Hao B. Cvtree update: a newly designed phylogenetic study platform using composition vectors and whole genomes. Nucleic Acids Res. 2009; 37(suppl_2):174\u20138.","journal-title":"Nucleic Acids Res"},{"key":"1884_CR32","doi-asserted-by":"crossref","unstructured":"Nigatu D, Henkel W. Prediction of essential genes based on machine learning and information theoretic features. In: Proceedings of the 10th International Joint Conference on Biomedical Engineering Systems and Technologies - Volume 3: BIOINFORMATICS, (BIOSTEC 2017): 2017. p. 81\u201392. doi: 10.5220\/0006165700810092 .","DOI":"10.5220\/0006165700810092"},{"issue":"1","key":"1884_CR33","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1186\/s13637-015-0035-4","volume":"2016","author":"D Nigatu","year":"2016","unstructured":"Nigatu D, Henkel W, Sobetzko P, Muskhelishvili G. Relationship between digital information and thermodynamic stability in bacterial genomes. EURASIP J Bioinforma Syst Biol. 2016; 2016(1):1.","journal-title":"EURASIP J Bioinforma Syst Biol"},{"issue":"1","key":"1884_CR34","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1186\/1471-2105-9-1","volume":"9","author":"M Bauer","year":"2008","unstructured":"Bauer M, Schuster SM, Sayood K. The average mutual information profile as a genomic signature. BMC Bioinformatics. 2008; 9(1):1.","journal-title":"BMC Bioinformatics"},{"issue":"9","key":"1884_CR35","doi-asserted-by":"crossref","first-page":"1055","DOI":"10.1038\/nbt861","volume":"21","author":"SV Date","year":"2003","unstructured":"Date SV, Marcotte EM. Discovery of uncharacterized cellular systems by genome-wide analysis of functional linkages. Nat Biotechnol. 2003; 21(9):1055\u201362.","journal-title":"Nat Biotechnol"},{"key":"1884_CR36","doi-asserted-by":"crossref","unstructured":"Hagenauer J, Dawy Z, G\u00f6bel B, Hanus P, Mueller J. Genomic analysis using methods from information theory. In: Information Theory Workshop. IEEE: 2004. p. 55\u20139. doi: 10.1109\/ITW.2004.1405274 .","DOI":"10.1109\/ITW.2004.1405274"},{"key":"1884_CR37","volume-title":"Elements of Information Theory","author":"TM Cover","year":"2012","unstructured":"Cover TM, Thomas JA. Elements of Information Theory. Hoboken: Wiley; 2012."},{"key":"1884_CR38","doi-asserted-by":"crossref","first-page":"623","DOI":"10.1002\/j.1538-7305.1948.tb00917.x","volume":"27","author":"CE Shannon","year":"1948","unstructured":"Shannon CE. A mathematical theory of communication. Bell Syst Tech J. 1948; 27:623\u201356. doi: 10.1002\/j.1538-7305.1948.tb00917.x .","journal-title":"Bell Syst Tech J"},{"issue":"4","key":"1884_CR39","doi-asserted-by":"crossref","first-page":"1460","DOI":"10.1073\/pnas.95.4.1460","volume":"95","author":"J SantaLucia","year":"1998","unstructured":"SantaLucia J. A unified view of polymer, dumbbell, and oligonucleotide DNA nearest-neighbor thermodynamics. Proc Natl Acad Sci. 1998; 95(4):1460\u20135.","journal-title":"Proc Natl Acad Sci"},{"issue":"182-192","key":"1884_CR40","first-page":"13","volume":"8","author":"GJ Lidstone","year":"1920","unstructured":"Lidstone GJ. Note on the general case of the bayes-laplace formula for inductive or a posteriori probabilities. Trans Fac Actuaries. 1920; 8(182-192):13.","journal-title":"Trans Fac Actuaries"},{"key":"1884_CR41","doi-asserted-by":"crossref","first-page":"291","DOI":"10.1007\/11557067_24","volume":"3692","author":"D Dalevi","year":"2005","unstructured":"Dalevi D, Dubhashi D. The peres-shields order estimator for fixed and variable length markov models with applications to DNA sequence similarity. Lect Notes Comput Sci. 2005; 3692:291.","journal-title":"Lect Notes Comput Sci"},{"issue":"3","key":"1884_CR42","doi-asserted-by":"crossref","first-page":"488","DOI":"10.1017\/S0021900200048294","volume":"12","author":"H Tong","year":"1975","unstructured":"Tong H. Determination of the order of a Markov chain by Akaike\u2019s information criterion. J Appl Probab. 1975; 12(3):488\u201397.","journal-title":"J Appl Probab"},{"issue":"3","key":"1884_CR43","doi-asserted-by":"crossref","first-page":"243","DOI":"10.2307\/1267787","volume":"23","author":"RW Katz","year":"1981","unstructured":"Katz RW. On some criteria for estimating the order of a markov chain. Technometrics. 1981; 23(3):243\u20139.","journal-title":"Technometrics"},{"key":"1884_CR44","unstructured":"Peres Y, Shields P. Two new Markov order estimators. ArXiv preprint http:\/\/arxiv.org\/abs\/math\/0506080. 2005."},{"issue":"1","key":"1884_CR45","doi-asserted-by":"crossref","first-page":"59","DOI":"10.1007\/s11009-008-9107-1","volume":"13","author":"M Men\u00e9ndez","year":"2011","unstructured":"Men\u00e9ndez M, Pardo L, Pardo M, Zografos K. Testing the order of markov dependence in DNA sequences. Methodol Comput Appl Probab. 2011; 13(1):59\u201374.","journal-title":"Methodol Comput Appl Probab"},{"issue":"7","key":"1884_CR46","doi-asserted-by":"crossref","first-page":"1593","DOI":"10.1016\/j.physa.2012.12.017","volume":"392","author":"M Papapetrou","year":"2013","unstructured":"Papapetrou M, Kugiumtzis D. Markov chain order estimation with conditional mutual information. Phys A Stat Mech Appl. 2013; 392(7):1593\u2013601. doi: 10.1016\/j.physa.2012.12.017 . 1301.0148 .","journal-title":"Phys A Stat Mech Appl"},{"issue":"1","key":"1884_CR47","doi-asserted-by":"crossref","first-page":"79","DOI":"10.1214\/aoms\/1177729694","volume":"22","author":"S Kullback","year":"1951","unstructured":"Kullback S, Leibler RA. On information and sufficiency. Ann Math Stat. 1951; 22(1):79\u201386.","journal-title":"Ann Math Stat"},{"key":"1884_CR48","doi-asserted-by":"crossref","unstructured":"Berthold MR, Cebron N, Dill F, Gabriel TR, K\u00f6tter T, Meinl T, Ohl P, Sieb C, Thiel K, Wiswedel B. KNIME: the Konstanz Information Miner. In: Studies in classification, data analysis, and knowledge organization (GfKL 2007), vol. 11. Springer: 2007. p. 319\u201326.","DOI":"10.1007\/978-3-540-78246-9_38"},{"issue":"24","key":"1884_CR49","doi-asserted-by":"crossref","first-page":"5339","DOI":"10.1093\/nar\/gkf691","volume":"30","author":"C Condon","year":"2002","unstructured":"Condon C, Putzer H. The phylogenetic distribution of bacterial ribonucleases. Nucleic Acids Res. 2002; 30(24):5339\u201346.","journal-title":"Nucleic Acids Res"},{"issue":"5","key":"1884_CR50","doi-asserted-by":"crossref","first-page":"359","DOI":"10.1089\/dna.1995.14.359","volume":"14","author":"Y ZHAO","year":"1995","unstructured":"ZHAO Y, LIEBERMAN HB. Schizosaccharomyces pombe: a model for molecular studies of eukaryotic genes. DNA Cell Biol. 1995; 14(5):359\u201371.","journal-title":"DNA Cell Biol"},{"issue":"1","key":"1884_CR51","doi-asserted-by":"crossref","first-page":"170","DOI":"10.1186\/s12859-017-1584-1","volume":"18","author":"M Yousef","year":"2017","unstructured":"Yousef M, Khalifa W, Acar \u0130E, Allmer J. Microrna categorization using sequence motifs and k-mers. BMC Bioinformatics. 2017; 18(1):170.","journal-title":"BMC Bioinformatics"}],"container-title":["BMC Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s12859-017-1884-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,10,5]],"date-time":"2019-10-05T18:11:49Z","timestamp":1570299109000},"score":1,"resource":{"primary":{"URL":"https:\/\/bmcbioinformatics.biomedcentral.com\/articles\/10.1186\/s12859-017-1884-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,11,9]]},"references-count":51,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2017,12]]}},"alternative-id":["1884"],"URL":"https:\/\/doi.org\/10.1186\/s12859-017-1884-5","relation":{},"ISSN":["1471-2105"],"issn-type":[{"value":"1471-2105","type":"electronic"}],"subject":[],"published":{"date-parts":[[2017,11,9]]},"article-number":"473"}}