{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,4,10]],"date-time":"2025-04-10T05:11:31Z","timestamp":1744261891848},"reference-count":30,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2013,7,3]],"date-time":"2013-07-03T00:00:00Z","timestamp":1372809600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/2.0"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["BMC Bioinformatics"],"published-print":{"date-parts":[[2013,12]]},"DOI":"10.1186\/1471-2105-14-213","type":"journal-article","created":{"date-parts":[[2013,7,3]],"date-time":"2013-07-03T08:14:13Z","timestamp":1372839253000},"source":"Crossref","is-referenced-by-count":14,"title":["PFClust: a novel parameter free clustering algorithm"],"prefix":"10.1186","volume":"14","author":[{"given":"Lazaros","family":"Mavridis","sequence":"first","affiliation":[]},{"given":"Neetika","family":"Nath","sequence":"additional","affiliation":[]},{"given":"John BO","family":"Mitchell","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2013,7,3]]},"reference":[{"key":"5991_CR1","doi-asserted-by":"publisher","first-page":"45","DOI":"10.1186\/1471-2105-5-45","volume":"5","author":"TJ Harlow","year":"2004","unstructured":"Harlow TJ, Gogarten JP, Ragan MA: A hybrid clustering approach to recognition of protein families in 114 microbial genomes. BMC Bioinformatics. 2004, 5: 45-10.1186\/1471-2105-5-45.","journal-title":"BMC Bioinformatics"},{"key":"5991_CR2","volume-title":"Technical Report 1530, Department of Computer Sciences","author":"X Zhu","year":"2005","unstructured":"Zhu X: Semi-Supervised Learning Literature Survey. Technical Report 1530, Department of Computer Sciences. 2005, Madison: University of Wisconsin, \n                    http:\/\/pages.cs.wisc.edu\/~jerryzhu\/pub\/ssl_survey.pdf\n                    \n                  ,"},{"key":"5991_CR3","first-page":"34","volume":"30","author":"NN Pise","year":"2008","unstructured":"Pise NN, Kulkarni P: A Survey of Semi-Supervised Learning Methods. International Conference on Computational Intelligence and Security. 2008, 30: 34-[\n                    http:\/\/ieeexplore.ieee.org\/stamp\/stamp.jsp?tp=&arnumber=4724730\n                    \n                  ]","journal-title":"International Conference on Computational Intelligence and Security"},{"key":"5991_CR4","doi-asserted-by":"publisher","first-page":"264","DOI":"10.1145\/331499.331504","volume":"31","author":"A Jain","year":"1991","unstructured":"Jain A, Murty M, Flynn P: Data clustering: a review. ACM Comput Surv. 1991, 31: 264-323.","journal-title":"ACM Comput Surv"},{"key":"5991_CR5","doi-asserted-by":"publisher","first-page":"3201","DOI":"10.1093\/bioinformatics\/bti517","volume":"21","author":"J Handl","year":"2005","unstructured":"Handl J, Knowles J, Kell DB: Computational cluster validation in post-genomic data analysis. Bioinformatics. 2005, 21: 3201-3212. 10.1093\/bioinformatics\/bti517.","journal-title":"Bioinformatics"},{"key":"5991_CR6","doi-asserted-by":"publisher","first-page":"373","DOI":"10.1093\/comjnl\/9.4.373","volume":"9","author":"BGN Lance","year":"1967","unstructured":"Lance BGN, Williams WT: A general theory of classificatory sorting strategies 1. Hierarchical systems. Comput J. 1967, 9: 373-380. 10.1093\/comjnl\/9.4.373.","journal-title":"Comput J"},{"key":"5991_CR7","doi-asserted-by":"publisher","first-page":"651","DOI":"10.1016\/j.patrec.2009.09.011","volume":"31","author":"AK Jain","year":"2010","unstructured":"Jain AK: Data clustering: 50 years beyond K-means. Pattern Recognition Letters. 2010, 31: 651-666. 10.1016\/j.patrec.2009.09.011.","journal-title":"Pattern Recognition Letters"},{"key":"5991_CR8","doi-asserted-by":"publisher","first-page":"411","DOI":"10.1111\/1467-9868.00293","volume":"63","author":"R Tibshirani","year":"2001","unstructured":"Tibshirani R, Walther G, Hastie T: Estimating the number of clusters in a data set via the gap statistic. Journal of the Royal Statistical Society Series B Statistical Methodology. 2001, 63: 411-423. 10.1111\/1467-9868.00293.","journal-title":"Journal of the Royal Statistical Society Series B Statistical Methodology"},{"key":"5991_CR9","doi-asserted-by":"publisher","first-page":"462","DOI":"10.1186\/1471-2105-9-462","volume":"9","author":"R Giancarlo","year":"2008","unstructured":"Giancarlo R, Scaturro D, Utro F: Computational cluster validation for microarray data analysis: experimental assessment of Clest, Consensus Clustering, Figure of Merit. Gap Statistics and Model Explorer. BMC Bioinformatics. 2008, 9: 462-10.1186\/1471-2105-9-462.","journal-title":"BMC Bioinformatics"},{"key":"5991_CR10","doi-asserted-by":"publisher","first-page":"53","DOI":"10.1016\/0377-0427(87)90125-7","volume":"20","author":"P Rousseeuw","year":"1987","unstructured":"Rousseeuw P: Silhouettes: a graphical aid to the interpretation and validation of cluster analysis. J Comput Appl Math. 1987, 20: 53-65.","journal-title":"J Comput Appl Math"},{"key":"5991_CR11","doi-asserted-by":"publisher","first-page":"32","DOI":"10.1080\/01969727308546046","volume":"3","author":"JC Dunn","year":"1973","unstructured":"Dunn JC: A Fuzzy Relative of the ISODATA Process and Its Use in Detecting Compact Well-Separated Clusters. J Cybernetics. 1973, 3: 32-57. 10.1080\/01969727308546046.","journal-title":"J Cybernetics"},{"key":"5991_CR12","doi-asserted-by":"publisher","first-page":"15","DOI":"10.1109\/3477.678624","volume":"28","author":"JC Bezdek","year":"1998","unstructured":"Bezdek JC, Pal NR: Some new indexes of cluster validity. IEEE transactions on systems, man, and cybernetics. Part B, Cybernetics. 1998, 28: 15-10.1109\/3477.658574.","journal-title":"IEEE transactions on systems, man, and cybernetics. Part B, Cybernetics"},{"key":"5991_CR13","doi-asserted-by":"publisher","first-page":"846","DOI":"10.1080\/01621459.1971.10482356","volume":"66","author":"WM Rand","year":"1971","unstructured":"Rand WM: Objective Criteria for the Evaluation of Clustering Methods. J Am Stat Assoc. 1971, 66: 846-850. 10.1080\/01621459.1971.10482356.","journal-title":"J Am Stat Assoc"},{"key":"5991_CR14","volume-title":"PICS: Parameter-free Identification of Cohesive Subgroups in Large Attributed Graphs","author":"L Akoglu","year":"2012","unstructured":"Akoglu L, Tong H, Meeder B, Faloutsos C: PICS: Parameter-free Identification of Cohesive Subgroups in Large Attributed Graphs. 2012, Anaheim, CA: SDM"},{"key":"5991_CR15","doi-asserted-by":"publisher","first-page":"498","DOI":"10.2174\/138920310794109094","volume":"11","author":"SR Shenoy","year":"2010","unstructured":"Shenoy SR, Jayaram B: Proteins: sequence to structure and function-current status. Curr Protein Pept Sci. 2010, 11: 498-514. 10.2174\/138920310794109094.","journal-title":"Curr Protein Pept Sci"},{"key":"5991_CR16","doi-asserted-by":"publisher","first-page":"35","DOI":"10.1093\/nar\/30.1.35","volume":"30","author":"CH Wu","year":"2002","unstructured":"Wu CH, Huang H, Arminski L, Castro-Alvear J, Chen Y, Hu ZZ, Ledley RS, Lewis KC, Mewes HW, Orcutt BC, Suzek BE, Tsugita A, Vinayaka CR, Yeh LSL, Zhang J, Barker WC: The Protein Information Resource: an integrated public resource of functional annotation of proteins. Nucleic Acids Res. 2002, 30: 35-37. 10.1093\/nar\/30.1.35.","journal-title":"Nucleic Acids Res"},{"key":"5991_CR17","doi-asserted-by":"publisher","first-page":"D211","DOI":"10.1093\/nar\/gkp985","volume":"38","author":"RD Finn","year":"2010","unstructured":"Finn RD, Mistry J, Tate J, Coggill P, Heger A, Pollington JE, Gavin OL, Gunasekaran P, Ceric G, Forslund K, Holm L, Sonnhammer ELL, Eddy SR, Bateman A: The Pfam protein families database. Nucleic Acids Res. 2010, 38: D211-D222. 10.1093\/nar\/gkp985.","journal-title":"Nucleic Acids Res"},{"key":"5991_CR18","doi-asserted-by":"publisher","first-page":"235","DOI":"10.1093\/nar\/28.1.235","volume":"28","author":"HM Berman","year":"2000","unstructured":"Berman HM, Westbrook J, Feng Z, Gilliland G, Bhat TN, Weissig H, Shindyalov IN, Bourne PE: The Protein Data Bank. Nucleic Acids Res. 2000, 28: 235-242. 10.1093\/nar\/28.1.235.","journal-title":"Nucleic Acids Res"},{"key":"5991_CR19","doi-asserted-by":"publisher","first-page":"D310","DOI":"10.1093\/nar\/gkn877","volume":"37","author":"AL Cuff","year":"2009","unstructured":"Cuff AL, Sillitoe I, Lewis T, Redfern OC, Garratt R, Thornton J, Orengo CA: The CATH classification revisited-architectures reviewed and new ways to characterize structural divergence in superfamilies. Nucleic Acids Res. 2009, 37: D310-314. 10.1093\/nar\/gkn877.","journal-title":"Nucleic Acids Res"},{"key":"5991_CR20","first-page":"536","volume":"247","author":"AG Murzin","year":"1995","unstructured":"Murzin AG, Brenner SE, Hubbard T, Chothia C: SCOP: a structural classification of proteins database for the investigation of sequences and structures. J Mol Biol. 1995, 247: 536-540.","journal-title":"J Mol Biol"},{"key":"5991_CR21","doi-asserted-by":"publisher","first-page":"88","DOI":"10.1107\/S0108767307035623","volume":"64","author":"HM Berman","year":"2008","unstructured":"Berman HM: The Protein Data Bank: a historical perspective. Acta Crystallographica Section A Foundations of Crystallography. 2008, 64: 88-95. 10.1107\/S0108767307035623.","journal-title":"Acta Crystallographica Section A Foundations of Crystallography"},{"key":"5991_CR22","doi-asserted-by":"publisher","DOI":"10.1002\/9780470316801","volume-title":"Finding Groups in Data: An Introduction to Cluster Analysis","author":"L Kaufman","year":"1990","unstructured":"Kaufman L, Rousseeuw PJ: Finding Groups in Data: An Introduction to Cluster Analysis. 1990, New York: Wiley"},{"key":"5991_CR23","doi-asserted-by":"publisher","first-page":"351","DOI":"10.1016\/S0957-4174(02)00185-9","volume":"24","author":"C Wei","year":"2003","unstructured":"Wei C: Empirical Comparison of Fast Clustering Algorithms for Large Data Sets. Experts Systems with Applications. 2003, 24: 351-363. 10.1016\/S0957-4174(02)00185-9.","journal-title":"Experts Systems with Applications"},{"key":"5991_CR24","first-page":"226","volume-title":"A Density-Based Algorithm for Discovering Clusters in Large Spatial Databases with Noise. Proceedings of 2nd International Conference on Knowledge Discovery and Data Mining","author":"M Ester","year":"1996","unstructured":"Ester M, Kriegel HP, Sander J, Xu X: A Density-Based Algorithm for Discovering Clusters in Large Spatial Databases with Noise. Proceedings of 2nd International Conference on Knowledge Discovery and Data Mining. 1996, 226-231. KDD-96"},{"key":"5991_CR25","doi-asserted-by":"publisher","first-page":"611","DOI":"10.1198\/016214502760047131","volume":"97","author":"C Fraley","year":"2002","unstructured":"Fraley C, Raftery AE: Model-based clustering, discriminant analysis, and density estimation. J Am Stat Assoc. 2002, 97: 611-631. 10.1198\/016214502760047131.","journal-title":"J Am Stat Assoc"},{"key":"5991_CR26","unstructured":"R: A language and environment for statistical computing; R development core team. 2005, Vienna, Austria: R foundation for statistical computing, \n                    http:\/\/www.r-project.org\/\n                    \n                  ,"},{"key":"5991_CR27","first-page":"281","volume-title":"Pac Symp Biocomput","author":"L Mavridis","year":"2010","unstructured":"Mavridis L, Ritchie DW: 3D-Blast: 3D protein structure alignment, comparison, and classification using spherical polar fourier correlations. Pac Symp Biocomput. 2010, 281-292."},{"key":"5991_CR28","doi-asserted-by":"publisher","first-page":"530","DOI":"10.1002\/prot.23218","volume":"80","author":"L Mavridis","year":"2011","unstructured":"Mavridis L, Ghoorah AW, Venkatraman V, Ritchie DW: Representing and comparing protein folds and fold families using three-dimensional shape-density representations. Proteins: Structure, Function and Bioinformatics. 2011, 80: 530-545.","journal-title":"Proteins: Structure, Function and Bioinformatics"},{"key":"5991_CR29","doi-asserted-by":"publisher","first-page":"178","DOI":"10.1002\/(SICI)1097-0134(20000501)39:2<178::AID-PROT8>3.0.CO;2-6","volume":"39","author":"DW Ritchie","year":"2000","unstructured":"Ritchie DW, Kemp GJ: Protein docking using spherical polar Fourier correlations. Proteins. 2000, 39: 178-194. 10.1002\/(SICI)1097-0134(20000501)39:2<178::AID-PROT8>3.0.CO;2-6.","journal-title":"Proteins"},{"key":"5991_CR30","doi-asserted-by":"publisher","first-page":"1273","DOI":"10.1109\/TPAMI.2002.1033218","volume":"24","author":"CJ Veenman","year":"2002","unstructured":"Veenman CJ, Reinders MJT, Backer E: A maximum variance cluster algorithm. Pattern Analysis and Machine Intelligence, IEEE Transactions. 2002, 24: 1273-1280. 10.1109\/TPAMI.2002.1033218.","journal-title":"Pattern Analysis and Machine Intelligence, IEEE Transactions"}],"container-title":["BMC Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/1471-2105-14-213.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/1471-2105-14-213\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/1471-2105-14-213.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,1,22]],"date-time":"2019-01-22T10:46:15Z","timestamp":1548153975000},"score":1,"resource":{"primary":{"URL":"https:\/\/bmcbioinformatics.biomedcentral.com\/articles\/10.1186\/1471-2105-14-213"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2013,7,3]]},"references-count":30,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2013,12]]}},"alternative-id":["5991"],"URL":"https:\/\/doi.org\/10.1186\/1471-2105-14-213","relation":{},"ISSN":["1471-2105"],"issn-type":[{"value":"1471-2105","type":"electronic"}],"subject":[],"published":{"date-parts":[[2013,7,3]]},"article-number":"213"}}