{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,10]],"date-time":"2024-09-10T15:42:46Z","timestamp":1725982966324},"publisher-location":"Cham","reference-count":77,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319940298"},{"type":"electronic","value":"9783319940304"}],"license":[{"start":{"date-parts":[[2018,7,4]],"date-time":"2018-07-04T00:00:00Z","timestamp":1530662400000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2019]]},"DOI":"10.1007\/978-3-319-94030-4_5","type":"book-chapter","created":{"date-parts":[[2018,7,3]],"date-time":"2018-07-03T12:22:48Z","timestamp":1530620568000},"page":"101-127","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["Machine Learning Methods for the Protein Fold Recognition Problem"],"prefix":"10.1007","author":[{"given":"Katarzyna","family":"Stapor","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Irena","family":"Roterman-Konieczna","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Piotr","family":"Fabian","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2018,7,4]]},"reference":[{"key":"5_CR1","unstructured":"Alpaydin, E.: Introduction to Machine Learning. MIT Press (2009)"},{"key":"5_CR2","doi-asserted-by":"crossref","unstructured":"Altschul, S.F., et al.: Gapped BLAST and PSI-BLAST: a new generation of protein database search programs. Nucleic Acids Res. 3389\u20133402 (1997)","DOI":"10.1093\/nar\/25.17.3389"},{"key":"5_CR3","doi-asserted-by":"crossref","unstructured":"Anfinsen, B.C.: Principles that govern the folding of protein chains. Science, 223\u2013230 (1973)","DOI":"10.1126\/science.181.4096.223"},{"key":"5_CR4","doi-asserted-by":"crossref","unstructured":"Apweiler, R., Bairoch, A., Wu, C.H., et al.: UniProt: the universal protein knowledgebase. Nucleic Acids Res. D115\u2013D119 (2004)","DOI":"10.1093\/nar\/gkh131"},{"key":"5_CR5","doi-asserted-by":"crossref","unstructured":"Banach, M., Konieczny, L., Roterman, I.: The late-stage intermediate. In: Protein Folding in Silico, pp. 21\u201338","DOI":"10.1533\/9781908818256.21"},{"key":"5_CR6","doi-asserted-by":"crossref","unstructured":"Banach, M., Konieczny, L., Roterman, I.: The fuzzy oil drop model, based on hydrophobicity density distribution, generalizes the influence of water environment on protein structure and function. J. Theor Biol. 6\u201317 (2014)","DOI":"10.1016\/j.jtbi.2014.05.007"},{"key":"5_CR7","doi-asserted-by":"crossref","unstructured":"Berman, H.M., et al. The protein databank. Nucleic Acids Res. 235\u2013242 (2000)","DOI":"10.1093\/nar\/28.1.235"},{"key":"5_CR8","volume-title":"Pattern Recognition and Machine Learning","author":"MCh Bishop","year":"2006","unstructured":"Bishop, MCh.: Pattern Recognition and Machine Learning. Springer, New York (2006)"},{"key":"5_CR9","doi-asserted-by":"crossref","unstructured":"Breiman, L.: Bagging predictors. Mach. Learn. 123\u2013140 (1996)","DOI":"10.1007\/BF00058655"},{"key":"5_CR10","doi-asserted-by":"crossref","unstructured":"Breiman, L.: Random Forests. Mach. Learn. 5\u201332 (2001)","DOI":"10.1023\/A:1010933404324"},{"key":"5_CR11","unstructured":"Breiman, L., Friedman, J., Olshen, R., Stone, C.: Classification and Regression Trees (1984)"},{"key":"5_CR12","doi-asserted-by":"crossref","unstructured":"Brown, G., et al.: Diversity creation methods: a survey and categorization. Inf. Fusion, 5\u201320 (2005)","DOI":"10.1016\/j.inffus.2004.04.004"},{"key":"5_CR13","doi-asserted-by":"crossref","unstructured":"Chan, H.S., Dill, K.: The protein folding problem. Phys. Today, 24\u201332 (1993)","DOI":"10.1063\/1.881371"},{"key":"5_CR14","doi-asserted-by":"crossref","unstructured":"Chen, D., Tian, X., Zhou, B., Gao, J.: ProFold: protein fold classification with additional structural features and a novel ensemble classifier. BioMed. Res. Int. (2016)","DOI":"10.1155\/2016\/6802832"},{"key":"5_CR15","doi-asserted-by":"crossref","unstructured":"Chen, K., Kurgan, L.: PFRES: protein fold classification by using evolutionary information and predicted secondary structure. Bioinformatics, 2843\u20132850 (2007)","DOI":"10.1093\/bioinformatics\/btm475"},{"key":"5_CR16","doi-asserted-by":"crossref","unstructured":"Cheng, J.: SCRATCH: a protein structure and structural feature prediction server. Nucleid Acid Res. 72\u201376 (2005)","DOI":"10.1093\/nar\/gki396"},{"key":"5_CR17","doi-asserted-by":"crossref","unstructured":"Chinnasamy, A., Sung, W.K., Mittal, A.: Protein structure and fold prediction using tree-augmented na\u00efve Bayesian classifier. In: Proceedings of PSB, Stanford CA (2004)","DOI":"10.1142\/S0219720005001302"},{"key":"5_CR18","doi-asserted-by":"crossref","unstructured":"Chmielnicki, W., Stapor, K.: Protein fold recognition with combined RDA-SVM classifier. Lecture Notes on Artificial Intelligence, pp. 162\u2013169 (2010)","DOI":"10.1007\/978-3-642-13769-3_20"},{"key":"5_CR19","doi-asserted-by":"crossref","unstructured":"Chmielnicki, W., Stapor, K.: A hybrid discriminative\/generative approach to protein fold recognition. Neurocomputing, 194\u2013198 (2012)","DOI":"10.1016\/j.neucom.2011.04.033"},{"key":"5_CR20","doi-asserted-by":"crossref","unstructured":"Chothia, C.: One thousand families for the molecular biologist. Nature, 543\u2013544 (1992)","DOI":"10.1038\/357543a0"},{"key":"5_CR21","doi-asserted-by":"crossref","unstructured":"Chou, K.C.: Prediction of protein cellular attributes using pseudo-amino acid composition. Proteins, 246\u2013255 (2001)","DOI":"10.1002\/prot.1035"},{"key":"5_CR22","doi-asserted-by":"crossref","unstructured":"Chou, K.C.: Pseudo amino acid composition and its applications in bioinformatics, proteomics and system biology. Curr. Proteomics, 262\u2013274","DOI":"10.2174\/157016409789973707"},{"key":"5_CR23","doi-asserted-by":"crossref","unstructured":"Clearly, J.G., Trigg, I.E.: K*: an instance-based learner using an entropic distance measure. Proc. Int. Conf. Mach. Learn. 108\u2013114 (1995)","DOI":"10.1016\/B978-1-55860-377-6.50022-0"},{"key":"5_CR24","unstructured":"Crammer, K., Singer, Y.: On the learnability and design of output codes for multiclass problems. In: 13th Computational Learning Theory Conference, pp. 35\u201346 (2000)"},{"key":"5_CR25","unstructured":"Craven, M.W., Mural, R.J., Hauser, L.J., Uberbacher, E.C.: Predicting protein folding classes without overly relying on homology. In: Proceedings of Intelligent Systems in Molecular Biology (ISMB), pp. 98\u2013106 (1995)"},{"key":"5_CR26","doi-asserted-by":"crossref","unstructured":"Damoulas, T., Girolami, M.: Probabilistic multi-class multi-kernel learning: on protein fold recognition and remote homology detection. Bioinformatics, 1264\u20131270 (2008)","DOI":"10.1093\/bioinformatics\/btn112"},{"key":"5_CR27","doi-asserted-by":"crossref","unstructured":"Denoeux, T.: A k-nearest neighbor classification rule based on Dempster-Shafer theory. IEEE Trans. Syst. Man Cybern. 804\u2013813 (1995)","DOI":"10.1109\/21.376493"},{"key":"5_CR28","doi-asserted-by":"crossref","unstructured":"Deschavanne, P., Tuffery, P.: Enhanced protein fold recognition using a structural alphabet. Proteins, 129\u2013137 (2009)","DOI":"10.1002\/prot.22324"},{"key":"5_CR29","doi-asserted-by":"crossref","unstructured":"Dietterich, T.G.: Ensemble methods in machine learning. In: 1st International Workshop on Multiple Classifier Systems, pp. 1\u201315 (2000)","DOI":"10.1007\/3-540-45014-9_1"},{"key":"5_CR30","doi-asserted-by":"crossref","unstructured":"Dill, K.A., Chan, H.S.: From Levinthal to pathways to funnels. Nat. Struct. Biol. 10\u201319 (1997)","DOI":"10.1038\/nsb0197-10"},{"key":"5_CR31","doi-asserted-by":"crossref","unstructured":"Ding, C.H., Dubchak, I.: Multi-class protein fold recognition using support vector machines and neural networks. Bioinformatics, pp. 349\u2013358 (2001)","DOI":"10.1093\/bioinformatics\/17.4.349"},{"key":"5_CR32","doi-asserted-by":"crossref","unstructured":"Dong, Q., Zhou, S., Guan, J.: A new taxonomy-based protein fold recognition approach based on autocross-covariance transformation. Bioinformatics, 2655\u20132662 (2009)","DOI":"10.1093\/bioinformatics\/btp500"},{"key":"5_CR33","doi-asserted-by":"crossref","unstructured":"Dubchak, I., Muchnik, I. Holbrook, S.R., Kim, S.H.: Prediction of protein folding class using global description of amino acid sequence. Proc. Natl. Acad. Sci. USA, 8700\u20138704 (1995)","DOI":"10.1073\/pnas.92.19.8700"},{"key":"5_CR34","doi-asserted-by":"crossref","unstructured":"Freund, Y., Shapire, R.: A decision-theoretic generalization of online learning and an application to boosting. J. Comput. Sys. Sci. 119\u2013139 (1997)","DOI":"10.1006\/jcss.1997.1504"},{"key":"5_CR35","doi-asserted-by":"crossref","unstructured":"Ghahramani, Z.: An introduction to Hidden Markov Models and Bayesian networks. Int. J. Pattern Recognit. Artif. Intell. 9\u201342","DOI":"10.1142\/9789812797605_0002"},{"key":"5_CR36","doi-asserted-by":"crossref","unstructured":"Guo, X., Gao, X.: A novel hierarchical ensemble classifier for protein fold recognition. Protein Eng. Des. Sel. 659\u2013664 (2008)","DOI":"10.1093\/protein\/gzn045"},{"key":"5_CR37","doi-asserted-by":"crossref","unstructured":"Hastie, T., Tibshirani, R., Friedman, J.: The Elements of Statistical Learning: Data Mining, Inference, and Prediction. Springer (2009)","DOI":"10.1007\/978-0-387-84858-7"},{"key":"5_CR38","doi-asserted-by":"crossref","unstructured":"Hinton, G.E., Osindero S., Teh, Y.: A fast learning algorithm for deep belief nets. Neural Comput. 1527\u20131554 (2006)","DOI":"10.1162\/neco.2006.18.7.1527"},{"key":"5_CR39","doi-asserted-by":"crossref","unstructured":"Huang, C.D., Lin, C.T., Pal, N.R.: Hierarchical learning architecture with automatic feature selection for multiclass protein fold classification. IEEE Trans. Nanobiosci. 221\u2013232 (2003)","DOI":"10.1109\/TNB.2003.820284"},{"key":"5_CR40","doi-asserted-by":"crossref","unstructured":"Ibrahim, W., Abadeh, M.S.: Extracting features from protein sequences to improve deep extreme learning machine for protein fold recognition. J. Theor. Biol. 1\u201315 (2017)","DOI":"10.1016\/j.jtbi.2017.03.023"},{"key":"5_CR41","doi-asserted-by":"crossref","unstructured":"Jo, T., Hou, J., Eickholt, J., Cheng, J.: Improving protein fold recognition by deep learning networks. Sci. Rep. (2015)","DOI":"10.1038\/srep17573"},{"key":"5_CR42","doi-asserted-by":"crossref","unstructured":"Jones, D.T.: Protein secondary structure prediction based on position-specific scoring matrices. J. Mol. Biol. 195\u2013202 (1999)","DOI":"10.1006\/jmbi.1999.3091"},{"key":"5_CR43","doi-asserted-by":"crossref","unstructured":"Jurkowski, W., Baster, Z., Dulak, D., Roterman, I.: The early-stage intermediate. In: Protein Folding in Silico, pp. 1\u201320 (2012)","DOI":"10.1533\/9781908818256.1"},{"key":"5_CR44","doi-asserted-by":"crossref","unstructured":"Kmiecik, S., Gront, D., Kolinski, M., Wieteska, L., Dawid, A.E., Kolinski, A.: Coarse-grained protein models and their applications. Chem. Rev. 7898\u20137936 (2016)","DOI":"10.1021\/acs.chemrev.6b00163"},{"key":"5_CR45","doi-asserted-by":"crossref","unstructured":"Konieczny, L., Roterman-Konieczna, I., Sp\u00f3lnik, P.: The structure and function of living organisms. Syst. Biol. 1\u201332 (2013)","DOI":"10.1007\/978-3-319-01336-7_1"},{"key":"5_CR46","doi-asserted-by":"crossref","unstructured":"Krupa, P., Sieradzan, A.K., Rackovsky, S., Baranowski, M., Olldziej, S., Scheraga, H.A., Liwo, A., Czaplewski, C.: Improvement of the treatment of loop structures in the UNRES force field by inclusion of coupling between backbone- and side-chain-local conformational states. J. Chem. Theory Comput. (2013)","DOI":"10.1021\/ct4004977"},{"key":"5_CR47","doi-asserted-by":"crossref","unstructured":"Leslie, C.S., et al.: Mismatch string kernels for discriminative protein classification. Bioinformatics, 467\u2013476 (2004)","DOI":"10.1093\/bioinformatics\/btg431"},{"key":"5_CR48","doi-asserted-by":"crossref","unstructured":"Levitt, M.: Accurate modeling of protein conformation by automatic segment matching. J. Mol. Biol. 507\u2013533 (1992)","DOI":"10.1016\/0022-2836(92)90964-L"},{"key":"5_CR49","doi-asserted-by":"crossref","unstructured":"Li, J., Wu, J., Chen, K.: PFP-RFSM: protein fold prediction by using random forests and sequence motifs. J. Biomed. Sci. Eng. 1161\u20131170 (2013)","DOI":"10.4236\/jbise.2013.612145"},{"key":"5_CR50","doi-asserted-by":"crossref","unstructured":"Liao, L., Noble, W.S.: Combining pairwise sequence similarity and support vector machines for detecting remote protein evolutionary and structural relationships. J. Comput. Biol. 857\u2013868 (2003)","DOI":"10.1089\/106652703322756113"},{"key":"5_CR51","doi-asserted-by":"crossref","unstructured":"Lin, K.L., Lin, C.Y., Huang, C.D., Chang, H.M., Yang, C.Y., Lin, C.T., Hsu, D.F.: Feature selection and combination criteria for improving accuracy in protein structure prediction. IEEE Trans. NanoBiosci. 186\u2013196 (2007)","DOI":"10.1109\/TNB.2007.897482"},{"key":"5_CR52","doi-asserted-by":"crossref","unstructured":"Lindahl, E., Elofsson, A.: Identification of related proteins on family, superfamily and fold level. J. Mol. Biol. 613\u2013625 (2000)","DOI":"10.1006\/jmbi.1999.3377"},{"key":"5_CR53","doi-asserted-by":"crossref","unstructured":"Lo Conte, L., Ailey, B., Hubbard, T.J.P., Brenner, S.E., Murzin, A.G., Chothia, C.: SCOP: a structural classification of protein database. Nucleic Acids Res. 257\u2013259 (2000)","DOI":"10.1093\/nar\/28.1.257"},{"key":"5_CR54","doi-asserted-by":"crossref","unstructured":"Marchler-Bauer, A., et al.: CDD: a conserved domain database for interactive domain family analysis. Nucleid Acid Res. D237\u2013D240 (2007)","DOI":"10.1093\/nar\/gkl951"},{"key":"5_CR55","doi-asserted-by":"crossref","unstructured":"Nanni, L.: A novel ensemble of classifiers for protein fold recognition. Neurocomputing, 2434\u20132437 (2006)","DOI":"10.1016\/j.neucom.2006.01.026"},{"key":"5_CR56","unstructured":"Okun, O.: Protein fold recognition with k-local hyperplane distance nearest neighbor algorithm. In: Proceedings of the Second European Workshop on Data Mining and Text Mining in Bioinformatics, pp. 51\u201357 (2004)"},{"key":"5_CR57","doi-asserted-by":"crossref","unstructured":"Pedersen, J.T., Moult, J.: Genetic algorithms for protein structure prediction. Curr. Opin. Struct. Biol. 227\u2013231 (1996)","DOI":"10.1016\/S0959-440X(96)80079-0"},{"key":"5_CR58","doi-asserted-by":"crossref","unstructured":"Rangwala, H., Karypis, G.: Profile-based direct kernels for remote homology detection and fold recognition. Bioinformatics, 4239\u20134247 (2005)","DOI":"10.21236\/ADA439489"},{"key":"5_CR59","doi-asserted-by":"crossref","unstructured":"Rashid, M.A., Newton, M.A.H., Hoque, M.T., Sattar, A.: Mixing energy models in genetic algorithms for on-lattice protein structure prediction. BioMed. Res. Int. (2013)","DOI":"10.1155\/2013\/924137"},{"key":"5_CR60","doi-asserted-by":"crossref","unstructured":"Rokach, L.: Ensemble-based classifiers. Artif. Intell. Rev. 1\u201339 (2010)","DOI":"10.1007\/s10462-009-9124-7"},{"key":"5_CR61","unstructured":"Roterman, I., Bryli\u0144ski, M., Konieczny, L., Jurkowski, W.: Early-stage protein folding\u2014in silico model. Recent Adv. Struct. Biol. (2007)"},{"key":"5_CR62","doi-asserted-by":"crossref","unstructured":"Saigo, H., et al.: Protein homology detection using string alignment kernels. Bioinformatics, 1682\u20131689 (2004)","DOI":"10.1093\/bioinformatics\/bth141"},{"key":"5_CR63","doi-asserted-by":"crossref","unstructured":"Sali, A., Blundell, T.L.: Comparative protein modelling by satisfaction of spatial restraints. J. Mol. Biol. 779\u2013815 (1993)","DOI":"10.1006\/jmbi.1993.1626"},{"key":"5_CR64","doi-asserted-by":"crossref","unstructured":"Schaffer, A., et al.: Improving the accuracy of PSI-BLAST protein database searches with composition-based statistics and other refinements. Nucleid Acids Res. 2994\u20133005 (2001)","DOI":"10.1093\/nar\/29.14.2994"},{"key":"5_CR65","doi-asserted-by":"crossref","unstructured":"Shamim, M., et al.: Support vector machine-based classification of protein folds using the structural properties of amino acid residues and amino acid residue pairs. Bioinformatics, 3320\u20133327 (2007)","DOI":"10.1093\/bioinformatics\/btm527"},{"key":"5_CR66","doi-asserted-by":"crossref","unstructured":"Shapire, R.: The strength of weak learnability. Mach. Learn. 197\u2013227 (1995)","DOI":"10.1007\/BF00116037"},{"key":"5_CR67","doi-asserted-by":"crossref","unstructured":"Sharma, A., Lyons, J., Dehzangi, A., Paliwal, K.: A feature extraction technique using bi-gram probabilities of position specific scoring matrix for protein fold recognition. J. Theor. Biol. 41\u201346 (2013)","DOI":"10.1016\/j.jtbi.2012.12.008"},{"key":"5_CR68","doi-asserted-by":"crossref","unstructured":"Shawe-Taylor, J., Cristiannini, N.: Kernel Methods for Pattern Analysis. Cambridge University Press (2004)","DOI":"10.1017\/CBO9780511809682"},{"key":"5_CR69","doi-asserted-by":"crossref","unstructured":"Shen, H.B., Chou, K.C.: Predicting protein fold pattern with functional domain and sequential evolution information. J. Theor. Biol. 441\u2013446 (2009)","DOI":"10.1016\/j.jtbi.2008.10.007"},{"key":"5_CR70","volume-title":"Classification methods in computer vision (in Polish)","author":"K Stapor","year":"2011","unstructured":"Stapor, K.: Classification methods in computer vision (in Polish). Scientific Publishing House PWN, Warsaw (2011)"},{"key":"5_CR71","doi-asserted-by":"crossref","unstructured":"Unger, R., Moult, J.: Genetic algorithms for protein folding simulations. J. Mol. Biol. 75\u201381 (1993)","DOI":"10.1006\/jmbi.1993.1258"},{"key":"5_CR72","doi-asserted-by":"crossref","unstructured":"Wei, L., Liao, M., Gao, X., Zou, Q.: Enhanced protein fold prediction method through a novel feature extraction technique. IEEE Trans. Nanobiosci. 649\u2013659","DOI":"10.1109\/TNB.2015.2450233"},{"key":"5_CR73","doi-asserted-by":"crossref","unstructured":"Wei, L., Zou, Q.: Recent progress in machine learning-based methods for protein fold recognition. Int. J. Mol. Sci. (2016)","DOI":"10.3390\/ijms17122118"},{"key":"5_CR74","doi-asserted-by":"crossref","unstructured":"Yang, J.-Y., Chen, X.: Improving taxonomy-based protein fold recognition by using global and local features. Proteins, 2053\u20132064 (2011)","DOI":"10.1002\/prot.23025"},{"key":"5_CR75","doi-asserted-by":"crossref","unstructured":"Ying, Y., Huang, K., Campbell, C.: 2009. Enhanced protein fold recognition through a novel data integration approach. BMC Bioinformat. 267\u2013287","DOI":"10.1186\/1471-2105-10-267"},{"key":"5_CR76","unstructured":"Yu, L., Liu, H.: Feature selection for high-dimensional data: a fast correlation-based filter solution. In: Proceedings of 10th International Conference Machine Learning, pp. 856\u2013863"},{"key":"5_CR77","doi-asserted-by":"crossref","unstructured":"Zouhal, L.M., Denoeux, T.: An evidence-theoretic kNN rule with parameter optimization. IEEE Trans. Syst. Man Cybern. 263\u2013271 (1998)","DOI":"10.1109\/5326.669565"}],"container-title":["Intelligent Systems Reference Library","Machine Learning Paradigms"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-94030-4_5","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,10,20]],"date-time":"2019-10-20T08:31:23Z","timestamp":1571560283000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-94030-4_5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,7,4]]},"ISBN":["9783319940298","9783319940304"],"references-count":77,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-94030-4_5","relation":{},"ISSN":["1868-4394","1868-4408"],"issn-type":[{"type":"print","value":"1868-4394"},{"type":"electronic","value":"1868-4408"}],"subject":[],"published":{"date-parts":[[2018,7,4]]}}}