{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,4]],"date-time":"2026-02-04T15:56:51Z","timestamp":1770220611169,"version":"3.49.0"},"reference-count":47,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2019,1,8]],"date-time":"2019-01-08T00:00:00Z","timestamp":1546905600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["BMC Bioinformatics"],"published-print":{"date-parts":[[2019,12]]},"DOI":"10.1186\/s12859-018-2554-y","type":"journal-article","created":{"date-parts":[[2019,1,8]],"date-time":"2019-01-08T12:44:14Z","timestamp":1546951454000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":40,"title":["A model to predict the function of hypothetical proteins through a nine-point classification scoring schema"],"prefix":"10.1186","volume":"20","author":[{"given":"Johny","family":"Ijaq","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Girik","family":"Malik","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5023-7618","authenticated-orcid":false,"given":"Anuj","family":"Kumar","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Partha Sarathi","family":"Das","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Narendra","family":"Meena","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Neeraja","family":"Bethi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Vijayaraghava Seshadri","family":"Sundararajan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8535-278X","authenticated-orcid":false,"given":"Prashanth","family":"Suravajhala","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2019,1,8]]},"reference":[{"issue":"12","key":"2554_CR1","doi-asserted-by":"publisher","first-page":"1248","DOI":"10.1038\/nbt1210-1248","volume":"28","author":"M Uhlen","year":"2010","unstructured":"Uhlen M, et al. Towards a knowledge-based human protein atlas. Nat Biotechnol. 2010;28(12):1248\u201350.","journal-title":"Nat Biotechnol"},{"issue":"1","key":"2554_CR2","doi-asserted-by":"publisher","first-page":"14","DOI":"10.1002\/cfg.66","volume":"2","author":"MY Galperin","year":"2001","unstructured":"Galperin MY. Conserved \u2018hypothetical\u2019 proteins: new hints and new puzzles. Comp Funct Genomics. 2001;2(1):14\u20138.","journal-title":"Comp Funct Genomics"},{"issue":"12","key":"2554_CR3","doi-asserted-by":"publisher","first-page":"1755","DOI":"10.1016\/j.str.2008.10.017","volume":"16","author":"G Nimrod","year":"2008","unstructured":"Nimrod G, et al. Detection of functionally important regions in \u201chypothetical proteins\u201d of known structure. Structure. 2008;16(12):1755\u201363.","journal-title":"Structure"},{"issue":"12","key":"2554_CR4","doi-asserted-by":"publisher","first-page":"e84263","DOI":"10.1371\/journal.pone.0084263","volume":"8","author":"M Shahbaaz","year":"2013","unstructured":"Shahbaaz M, et al. Functional annotation of conserved hypothetical proteins from Haemophilus influenzae Rd KW20. PLoS One. 2013;8(12):e84263.","journal-title":"PLoS One"},{"issue":"15","key":"2554_CR5","doi-asserted-by":"publisher","first-page":"722","DOI":"10.6026\/97320630008722","volume":"8","author":"R Mohan","year":"2012","unstructured":"Mohan R, Venugopal S. Computational structures and functional analysis of hypothetical proteins of Staphylococcus aureus. Bioinformation. 2012;8(15):722\u20138.","journal-title":"Bioinformation"},{"issue":"5","key":"2554_CR6","doi-asserted-by":"publisher","first-page":"379","DOI":"10.1093\/dnares\/dsi014","volume":"12","author":"M Murakami","year":"2005","unstructured":"Murakami M, et al. InCeP: intracellular pathway based on mKIAA protein-protein interactions. DNA Res. 2005;12(5):379\u201387.","journal-title":"DNA Res"},{"key":"2554_CR7","doi-asserted-by":"publisher","first-page":"119","DOI":"10.3389\/fgene.2015.00119","volume":"6","author":"J Ijaq","year":"2015","unstructured":"Ijaq J, et al. Annotation and curation of uncharacterized proteins-challenges. Front Genet. 2015;6:119.","journal-title":"Front Genet"},{"issue":"3","key":"2554_CR8","doi-asserted-by":"publisher","first-page":"e42","DOI":"10.1371\/journal.pcbi.0030042","volume":"3","author":"BA Shoemaker","year":"2007","unstructured":"Shoemaker BA, Panchenko AR. Deciphering protein\u2013protein interactions. Part I. Experimental techniques and databases. PLoS Comp Biol. 2007;3(3):e42.","journal-title":"PLoS Comp Biol"},{"key":"2554_CR9","doi-asserted-by":"publisher","first-page":"38","DOI":"10.1186\/1471-2105-5-38","volume":"5","author":"LV Zhang","year":"2004","unstructured":"Zhang LV, et al. Predicting co-complexed protein pairs using genomic and proteomic data integration. BMC Bioinformatics. 2004;5:38.","journal-title":"BMC Bioinformatics"},{"issue":"5538","key":"2554_CR10","doi-asserted-by":"publisher","first-page":"2266","DOI":"10.1126\/science.1063566","volume":"293","author":"Y Ji","year":"2001","unstructured":"Ji Y, et al. Identification of critical staphylococcal genes using conditional phenotypes generated by antisense RNA. Science. 2001;293(5538):2266\u20139.","journal-title":"Science"},{"issue":"6920","key":"2554_CR11","doi-asserted-by":"publisher","first-page":"231","DOI":"10.1038\/nature01278","volume":"421","author":"RS Kamath","year":"2003","unstructured":"Kamath RS, et al. Systematic functional analysis of the Caenorhabditis elegans genome using RNAi. Nature. 2003;421(6920):231\u20137.","journal-title":"Nature"},{"issue":"6896","key":"2554_CR12","doi-asserted-by":"publisher","first-page":"387","DOI":"10.1038\/nature00935","volume":"418","author":"G Giaever","year":"2002","unstructured":"Giaever G, et al. Functional profiling of the Saccharomyces cerevisiae genome. Nature. 2002;418(6896):387\u201391.","journal-title":"Nature"},{"issue":"3","key":"2554_CR13","doi-asserted-by":"publisher","first-page":"1009","DOI":"10.1073\/pnas.0606713104","volume":"104","author":"LA Gallagher","year":"2007","unstructured":"Gallagher LA, et al. A comprehensive transposon mutant library of Francisella novicida, a bioweapon surrogate. Proc Natl Acad Sci. 2007;104(3):1009\u201314.","journal-title":"Proc Natl Acad Sci"},{"issue":"6757","key":"2554_CR14","doi-asserted-by":"publisher","first-page":"86","DOI":"10.1038\/47056","volume":"402","author":"AJ Enright","year":"1999","unstructured":"Enright AJ, et al. Protein interaction maps for complete genomes based on gene fusion events. Nature. 1999;402(6757):86\u201390.","journal-title":"Nature"},{"issue":"8","key":"2554_CR15","doi-asserted-by":"publisher","first-page":"335","DOI":"10.6026\/97320630001335","volume":"1","author":"S Sivashankari","year":"2006","unstructured":"Sivashankari S, Shanmughavel P. Functional annotation of hypothetical proteins-a review. Bioinformation. 2006;1(8):335\u20138.","journal-title":"Bioinformation"},{"key":"2554_CR16","doi-asserted-by":"publisher","first-page":"136","DOI":"10.1016\/j.knosys.2018.03.027","volume":"151","author":"X Lei","year":"2018","unstructured":"Lei X, et al. Predicting essential proteins based on RNA-Seq, subcellular localization and GO annotation datasets. Knowl-Based Syst. 2018;151:136\u201347.","journal-title":"Knowl-Based Syst"},{"key":"2554_CR17","doi-asserted-by":"publisher","first-page":"65","DOI":"10.1016\/j.jtbi.2018.03.029","volume":"447","author":"M Li","year":"2018","unstructured":"Li M, et al. Identifying essential proteins based on sub-network partition and prioritization by integrating subcellular localization information. J Theor Biol. 2018;447:65\u201373.","journal-title":"J Theor Biol"},{"key":"2554_CR18","doi-asserted-by":"publisher","first-page":"44598","DOI":"10.1038\/srep44598","volume":"7","author":"J Sperschneider","year":"2017","unstructured":"Sperschneider J, et al. LOCALIZER: subcellular localization prediction of both plant and effector proteins in the plant cell. Sci Rep. 2017;7:44598.","journal-title":"Sci Rep"},{"issue":"13","key":"2554_CR19","doi-asserted-by":"publisher","first-page":"2185","DOI":"10.1093\/bioinformatics\/bty085","volume":"34","author":"C Zhen","year":"2018","unstructured":"Zhen C, et al. The lncLocator: a subcellular localization predictor for long non-coding RNAs based on a stacked ensemble classifier. Bioinformatics. 2018;34(13):2185\u201394.","journal-title":"Bioinformatics"},{"issue":"25","key":"2554_CR20","doi-asserted-by":"publisher","first-page":"14863","DOI":"10.1073\/pnas.95.25.14863","volume":"95","author":"MB Eisen","year":"1998","unstructured":"Eisen MB, et al. Cluster analysis and display of genome-wide expression patterns. Proc Natl Acad Sci U S A. 1998;95(25):14863\u20138.","journal-title":"Proc Natl Acad Sci U S A"},{"issue":"6","key":"2554_CR21","doi-asserted-by":"publisher","first-page":"947","DOI":"10.1089\/106652703322756168","volume":"10","author":"M Deng","year":"2003","unstructured":"Deng M, et al. Prediction of protein function using protein-protein interaction data. J Comput Biol. 2003;10(6):947\u201360.","journal-title":"J Comput Biol"},{"issue":"5","key":"2554_CR22","doi-asserted-by":"publisher","first-page":"455","DOI":"10.1093\/bioinformatics\/17.5.455","volume":"17","author":"JR Bock","year":"2001","unstructured":"Bock JR, Gough DA. Predicting protein-protein interactions from primary structure. Bioinformatics. 2001;17(5):455\u201360.","journal-title":"Bioinformatics"},{"issue":"5","key":"2554_CR23","doi-asserted-by":"publisher","first-page":"1356","DOI":"10.1046\/j.1432-1033.2002.02767.x","volume":"269","author":"P Fariselli","year":"2002","unstructured":"Fariselli P, et al. Prediction of protein--protein interaction sites in heterocomplexes with neural networks. Eur J Biochem. 2002;269(5):1356\u201361.","journal-title":"Eur J Biochem"},{"issue":"14","key":"2554_CR24","doi-asserted-by":"publisher","first-page":"8348","DOI":"10.1073\/pnas.0832373100","volume":"100","author":"OG Troyanskaya","year":"2003","unstructured":"Troyanskaya OG, et al. A Bayesian framework for combining heterogeneous data sources for gene function prediction (in Saccharomyces cerevisiae). Proc Natl Acad Sci U S A. 2003;100(14):8348\u201353.","journal-title":"Proc Natl Acad Sci U S A"},{"issue":"5644","key":"2554_CR25","doi-asserted-by":"publisher","first-page":"449","DOI":"10.1126\/science.1087361","volume":"302","author":"R Jansen","year":"2003","unstructured":"Jansen R, et al. A Bayesian networks approach for predicting protein\u2013protein interactions from genomic data. Science. 2003;302(5644):449\u201353.","journal-title":"Science"},{"issue":"24","key":"2554_CR26","doi-asserted-by":"publisher","first-page":"4394","DOI":"10.1093\/bioinformatics\/bti721","volume":"21","author":"XW Chen","year":"2005","unstructured":"Chen XW, Liu M. Prediction of protein\u2013protein interactions using random decision forest framework. Bioinformatics. 2005;21(24):4394\u2013400.","journal-title":"Bioinformatics"},{"issue":"5428","key":"2554_CR27","doi-asserted-by":"publisher","first-page":"751","DOI":"10.1126\/science.285.5428.751","volume":"285","author":"EM Marcotte","year":"1999","unstructured":"Marcotte EM, et al. Detecting protein function and protein\u2013protein interactions from genome sequences. Science. 1999;285(5428):751\u20133.","journal-title":"Science"},{"key":"2554_CR28","first-page":"81","volume-title":"Prediction of essential genes based on machine learning and information theoretic features","author":"D Nigatu","year":"2017","unstructured":"Nigatu D, Henkel W. Prediction of essential genes based on machine learning and information theoretic features. Proceedings of BIOSTEC 2017 \u2013 BIOINFORMATICS; 2017. p. 81\u201392."},{"issue":"2","key":"2554_CR29","doi-asserted-by":"publisher","first-page":"370","DOI":"10.1109\/TCBB.2015.2394487","volume":"14","author":"M Li","year":"2017","unstructured":"Li M, et al. United complex centrality for identification of essential proteins from PPI networks. IEEE\/ACM Trans Comput Biol Bioinform. 2017;14(2):370\u201380.","journal-title":"IEEE\/ACM Trans Comput Biol Bioinform"},{"issue":"3","key":"2554_CR30","doi-asserted-by":"publisher","first-page":"731","DOI":"10.1109\/TCYB.2016.2524994","volume":"47","author":"Z-H You","year":"2017","unstructured":"You Z-H, et al. Highly efficient framework for predicting interactions between proteins. IEEE Trans Cybern. 2017;47(3):731\u201343.","journal-title":"IEEE Trans Cybern"},{"issue":"1","key":"2554_CR31","doi-asserted-by":"publisher","first-page":"34","DOI":"10.6026\/97320630008034","volume":"8","author":"P Suravajhala","year":"2012","unstructured":"Suravajhala P, Sundararajan VS. A classification scoring schema to validate protein interactors. Bioinformation. 2012;8(1):34\u20139.","journal-title":"Bioinformation"},{"key":"2554_CR32","doi-asserted-by":"publisher","first-page":"265","DOI":"10.1186\/1471-2164-7-265","volume":"7","author":"AM Gustafson","year":"2006","unstructured":"Gustafson AM, et al. Towards the identification of essential genes using targeted genome sequencing and comparative analysis. BMC Genomics. 2006;7:265.","journal-title":"BMC Genomics"},{"issue":"3","key":"2554_CR33","doi-asserted-by":"publisher","first-page":"795","DOI":"10.1093\/nar\/gkq784","volume":"39","author":"J Deng","year":"2010","unstructured":"Deng J, et al. Investigating the predictability of essential genes across distantly related organisms using an integrative approach. Nucleic Acids Res. 2010;39(3):795\u2013807.","journal-title":"Nucleic Acids Res"},{"key":"2554_CR34","doi-asserted-by":"publisher","first-page":"87","DOI":"10.1186\/1752-0509-6-87","volume":"6","author":"W Peng","year":"2012","unstructured":"Peng W, et al. Iteration method for predicting essential proteins based on orthology and protein-protein interaction networks. BMC Syst Biol. 2012;6:87.","journal-title":"BMC Syst Biol"},{"issue":"1\u20132","key":"2554_CR35","doi-asserted-by":"publisher","first-page":"181","DOI":"10.1002\/prca.201200068","volume":"7","author":"J Wang","year":"2013","unstructured":"Wang J, et al. Computational approaches to predicting essential proteins: a survey. Proteomics Clin Appl. 2013;7(1\u20132):181\u201392.","journal-title":"Proteomics Clin Appl"},{"issue":"Suppl 8","key":"2554_CR36","doi-asserted-by":"publisher","first-page":"279","DOI":"10.1186\/s12859-016-1115-5","volume":"17","author":"G Li","year":"2016","unstructured":"Li G, et al. Predicting essential proteins based on subcellular localization, orthology and PPI networks. BMC Bioinformatics. 2016;17(Suppl 8):279.","journal-title":"BMC Bioinformatics"},{"issue":"2\u20133","key":"2554_CR37","doi-asserted-by":"publisher","first-page":"109","DOI":"10.1016\/S0014-5793(00)01199-6","volume":"468","author":"AJ Mighell","year":"2000","unstructured":"Mighell AJ, et al. Vertebrate pseudogenes. FEBS Lett. 2000;468(2\u20133):109\u201314.","journal-title":"FEBS Lett"},{"issue":"2","key":"2554_CR38","doi-asserted-by":"publisher","first-page":"169","DOI":"10.1007\/s11693-014-9148-4","volume":"8","author":"PR Shidhi","year":"2014","unstructured":"Shidhi PR, et al. Identifying pseudogenes from hypothetical proteins for making synthetic proteins. Syst Synth Biol. 2014;8(2):169\u201371.","journal-title":"Syst Synth Biol"},{"issue":"8","key":"2554_CR39","doi-asserted-by":"publisher","first-page":"1780","DOI":"10.1080\/07391102.2014.971429","volume":"33","author":"TC Fran\u00e7a","year":"2015","unstructured":"Fran\u00e7a TC. Homology modeling: an important tool for the drug discovery. J Biomol Struct Dyn. 2015;33(8):1780\u201393.","journal-title":"J Biomol Struct Dyn"},{"issue":"8","key":"2554_CR40","doi-asserted-by":"publisher","first-page":"1478","DOI":"10.1261\/rna.1951310","volume":"16","author":"H Jia","year":"2010","unstructured":"Jia H, et al. Genome-wide computational identification and manual annotation of human long noncoding RNA genes. RNA. 2010;16(8):1478\u201387.","journal-title":"RNA"},{"issue":"2","key":"2554_CR41","doi-asserted-by":"publisher","first-page":"179","DOI":"10.1109\/72.80230","volume":"1","author":"SI Gallant","year":"1990","unstructured":"Gallant SI. Perceptron-based learning algorithms. IEEE Trans Neural Netw. 1990;1(2):179\u201391.","journal-title":"IEEE Trans Neural Netw"},{"issue":"3","key":"2554_CR42","doi-asserted-by":"publisher","first-page":"623","DOI":"10.1109\/72.572101","volume":"8","author":"M Muselli","year":"1997","unstructured":"Muselli M. On the convergence properties of the pocket algorithm. IEEE Trans Neural Netw. 1997;8(3):623\u20139.","journal-title":"IEEE Trans Neural Netw"},{"key":"2554_CR43","volume-title":"The WEKA Workbench. Online Appendix for \u201cData Mining: Practical Machine Learning Tools and Techniques\u201d, Morgan Kaufmann, Fourth Edition","author":"E Frank","year":"2016","unstructured":"Eibe Frank, et al. The WEKA Workbench. Online Appendix for \u201cData Mining: Practical Machine Learning Tools and Techniques\u201d, Morgan Kaufmann, Fourth Edition, 2016."},{"issue":"1","key":"2554_CR44","doi-asserted-by":"publisher","first-page":"23","DOI":"10.1038\/nrc2036","volume":"7","author":"P Hu","year":"2007","unstructured":"Hu P, et al. Computational prediction of cancer-gene function. Nature Rev Cancer. 2007;7(1):23\u201334.","journal-title":"Nature Rev Cancer"},{"issue":"5","key":"2554_CR45","doi-asserted-by":"publisher","first-page":"412","DOI":"10.1093\/bioinformatics\/16.5.412","volume":"16","author":"P Baldi","year":"2000","unstructured":"Baldi P, et al. Assessing the accuracy of prediction algorithms for classification: an overview. Bioinformatics. 2000;16(5):412\u201324.","journal-title":"Bioinformatics"},{"issue":"2","key":"2554_CR46","doi-asserted-by":"publisher","first-page":"442","DOI":"10.1016\/0005-2795(75)90109-9","volume":"405","author":"BW Matthews","year":"1975","unstructured":"Matthews BW. Comparison of the predicted and observed secondary structure of T4 phage lysozyme. Biochim Biophys Acta. 1975;405(2):442\u201351.","journal-title":"Biochim Biophys Acta"},{"issue":"3","key":"2554_CR47","doi-asserted-by":"publisher","first-page":"e0118432","DOI":"10.1371\/journal.pone.0118432","volume":"10","author":"T Saito","year":"2015","unstructured":"Saito T, Rehmsmeier M. The precision-recall plot is more informative than the ROC plot when evaluating binary classifiers on imbalanced datasets. PLoS One. 2015;10(3):e0118432. \n                    https:\/\/doi.org\/10.1371\/journal.pone.0118432\n                    \n                  .","journal-title":"PLoS One"}],"container-title":["BMC Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s12859-018-2554-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/s12859-018-2554-y\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s12859-018-2554-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,1,7]],"date-time":"2020-01-07T19:06:52Z","timestamp":1578424012000},"score":1,"resource":{"primary":{"URL":"https:\/\/bmcbioinformatics.biomedcentral.com\/articles\/10.1186\/s12859-018-2554-y"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,1,8]]},"references-count":47,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2019,12]]}},"alternative-id":["2554"],"URL":"https:\/\/doi.org\/10.1186\/s12859-018-2554-y","relation":{},"ISSN":["1471-2105"],"issn-type":[{"value":"1471-2105","type":"electronic"}],"subject":[],"published":{"date-parts":[[2019,1,8]]},"assertion":[{"value":"5 June 2018","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"30 November 2018","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"8 January 2019","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"Not applicable.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval and consent to participate"}},{"value":"Not applicable.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}},{"value":"The authors declare no competing interests whatsoever.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}},{"value":"Springer Nature remains neutral with regard to jurisdictional claims in published maps and institutional affiliations.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Publisher\u2019s Note"}}],"article-number":"14"}}