{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,12]],"date-time":"2026-03-12T15:46:24Z","timestamp":1773330384044,"version":"3.50.1"},"reference-count":67,"publisher":"Springer Science and Business Media LLC","issue":"S8","content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["BMC Bioinformatics"],"published-print":{"date-parts":[[2014,7]]},"DOI":"10.1186\/1471-2105-15-s8-s4","type":"journal-article","created":{"date-parts":[[2014,7,14]],"date-time":"2014-07-14T11:04:15Z","timestamp":1405335855000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":9,"title":["Exploring representations of protein structure for automated remote homology detection and mapping of protein structure space"],"prefix":"10.1186","volume":"15","author":[{"given":"Kevin","family":"Molloy","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"M Jennifer","family":"Van","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Daniel","family":"Barbara","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Amarda","family":"Shehu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2014,7,14]]},"reference":[{"issue":"1","key":"6498_CR1","doi-asserted-by":"publisher","first-page":"197","DOI":"10.1110\/ps.9.1.197","volume":"9","author":"SE Brenner","year":"2000","unstructured":"Brenner SE, Levitt M: Expectations from structural genomics. Protein Sci. 2000, 9 (1): 197-200.","journal-title":"Protein Sci"},{"key":"6498_CR2","doi-asserted-by":"publisher","first-page":"995","DOI":"10.1038\/nrm2281","volume":"8","author":"D Lee","year":"2007","unstructured":"Lee D, Redfern O, Orengo C: Predicting protein function from sequence and structure. Nat Rev Mol Cell Biol. 2007, 8: 995-1005. 10.1038\/nrm2281.","journal-title":"Nat Rev Mol Cell Biol"},{"key":"6498_CR3","doi-asserted-by":"publisher","first-page":"3389","DOI":"10.1093\/nar\/25.17.3389","volume":"25","author":"SF Altschul","year":"1997","unstructured":"Altschul SF, Madden TL, Schaeffer AA, Zhang J, Zhang Z, Miller W, Lipman DJ: Gapped BLAST and PSI-BLAST: a new generation of protein database search programs. Nucl Acids Res. 1997, 25: 3389-3402. 10.1093\/nar\/25.17.3389.","journal-title":"Nucl Acids Res"},{"issue":"1","key":"6498_CR4","doi-asserted-by":"publisher","first-page":"217","DOI":"10.1093\/nar\/25.1.217","volume":"25","author":"A Bairoch","year":"1997","unstructured":"Bairoch A, Bucher P, Hoffmann K: The PROSITE database, its status in 1997. Nucl Acids Res. 1997, 25 (1): 217-221. 10.1093\/nar\/25.1.217.","journal-title":"Nucl Acids Res"},{"issue":"1","key":"6498_CR5","first-page":"134","volume":"32","author":"N Hulo","year":"2003","unstructured":"Hulo N, Sigrist CJ, Le Saux V, Langendijk-Genevaux PS, Bordoli L, Gattiker A, De Castro E, Bucher P, Bairoch A: Recent improvements to the PROSITE database. Nucl Acids Res. 2003, 32 (1): 134-137.","journal-title":"Nucl Acids Res"},{"issue":"3","key":"6498_CR6","doi-asserted-by":"publisher","first-page":"405","DOI":"10.1002\/(SICI)1097-0134(199707)28:3<405::AID-PROT10>3.0.CO;2-L","volume":"28","author":"EL Sonnhammer","year":"1997","unstructured":"Sonnhammer EL, Eddy SR, Durbin R: Pfam: a comprehensive database of protein domain families based on seed alignments. Proteins: Struct Funct Bioinf. 1997, 28 (3): 405-420. 10.1002\/(SICI)1097-0134(199707)28:3<405::AID-PROT10>3.0.CO;2-L.","journal-title":"Proteins: Struct Funct Bioinf"},{"issue":"1","key":"6498_CR7","doi-asserted-by":"publisher","first-page":"320","DOI":"10.1093\/nar\/26.1.320","volume":"26","author":"EL Sonnhammer","year":"1998","unstructured":"Sonnhammer EL, Eddy SR, Birney E, Bateman A, Durbin R: Pfam: Multiple sequence alignments and HMM-profiles of protein domains. Nucl Acids Res. 1998, 26 (1): 320-322. 10.1093\/nar\/26.1.320.","journal-title":"Nucl Acids Res"},{"issue":"9","key":"6498_CR8","doi-asserted-by":"publisher","first-page":"755","DOI":"10.1093\/bioinformatics\/14.9.755","volume":"14","author":"SR Eddy","year":"1998","unstructured":"Eddy SR: Profile hidden Markov models. Bioinformatics. 1998, 14 (9): 755-763. 10.1093\/bioinformatics\/14.9.755.","journal-title":"Bioinformatics"},{"key":"6498_CR9","first-page":"149","volume-title":"Int Conf Intell Sys Mol Biol (ISMB)","author":"T Jaakkola","year":"1999","unstructured":"Jaakkola T, Diekhans M, Haussler D: Using the fisher kernel method to detect remote protein homologies. Int Conf Intell Sys Mol Biol (ISMB). Edited by: Lengauer, T., Schneider, R., Bork, P., Brutlag, D., Glasgow, J., Mewes, H.-W., Zimmer, R. 1999, AAAI Press, Menlo Park, CA, 149-158."},{"issue":"6","key":"6498_CR10","doi-asserted-by":"publisher","first-page":"857","DOI":"10.1089\/106652703322756113","volume":"10","author":"L Liao","year":"2002","unstructured":"Liao L, Noble WS: Combining pairwise sequence similarity and support vector machines for detecting remote protein evolutionary and structural relationships. J Comp Biol. 2002, 10 (6): 857-868.","journal-title":"J Comp Biol"},{"issue":"3","key":"6498_CR11","doi-asserted-by":"publisher","first-page":"361","DOI":"10.1016\/S0959-440X(96)80056-X","volume":"6","author":"SR Eddy","year":"1995","unstructured":"Eddy SR: Hidden Markov models. Curr Opinion Struct Biol. 1995, 6 (3): 361-365.","journal-title":"Curr Opinion Struct Biol"},{"key":"6498_CR12","doi-asserted-by":"publisher","first-page":"416","DOI":"10.1038\/185416a0","volume":"185","author":"MF Perutz","year":"1960","unstructured":"Perutz MF, Rossmann MG, Cullis AF, Muirhead H, Will G, North ACT: Structure of myoglobin: a three-dimensional fourier synthesis at 5.5 angstrom resolution. Nature. 1960, 185: 416-422. 10.1038\/185416a0.","journal-title":"Nature"},{"key":"6498_CR13","doi-asserted-by":"publisher","first-page":"348","DOI":"10.1016\/S0959-440X(00)00214-1","volume":"11","author":"P Koehl","year":"2001","unstructured":"Koehl P: Protein structure similarities. Curr Opinion Struct Biol. 2001, 11: 348-353. 10.1016\/S0959-440X(00)00214-1.","journal-title":"Curr Opinion Struct Biol"},{"key":"6498_CR14","doi-asserted-by":"publisher","first-page":"1173","DOI":"10.1016\/j.jmb.2004.12.032","volume":"346","author":"R Kolodny","year":"2005","unstructured":"Kolodny R, Koehl P, Levitt M: Comprehensive evaluation of protein structure alignment methods: Scoring by geometric measures. J Mol Biol. 2005, 346: 1173-1188. 10.1016\/j.jmb.2004.12.032.","journal-title":"J Mol Biol"},{"key":"6498_CR15","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/0022-2836(89)90084-3","volume":"208","author":"WR Tayor","year":"1989","unstructured":"Tayor WR, Orengo CA: Protein structure alignment. J Mol Biol. 1989, 208: 1-22. 10.1016\/0022-2836(89)90084-3.","journal-title":"J Mol Biol"},{"issue":"7","key":"6498_CR16","doi-asserted-by":"publisher","first-page":"505","DOI":"10.1093\/protein\/2.7.505","volume":"2","author":"WR Taylor","year":"1989","unstructured":"Taylor WR, Orengo CA: A holistic approach to protein structure alignment. Protein Eng. 1989, 2 (7): 505-519. 10.1093\/protein\/2.7.505.","journal-title":"Protein Eng"},{"issue":"3","key":"6498_CR17","doi-asserted-by":"publisher","first-page":"654","DOI":"10.1110\/ps.8.3.654","volume":"8","author":"WR Taylor","year":"1999","unstructured":"Taylor WR: Protein structure comparison using iterated dynamic programming. Protein Sci. 1999, 8 (3): 654-665.","journal-title":"Protein Sci"},{"key":"6498_CR18","doi-asserted-by":"publisher","first-page":"617","DOI":"10.1016\/S0076-6879(96)66038-8","volume":"266","author":"CA Orengo","year":"1996","unstructured":"Orengo CA, Taylor WR: SSAP: sequential structure alignment program for protein structure comparison. Methods Enzymol. 1996, 266: 617-635.","journal-title":"Methods Enzymol"},{"issue":"Pt. 4","key":"6498_CR19","doi-asserted-by":"publisher","first-page":"842","DOI":"10.1107\/S0907444995016477","volume":"52","author":"GJ Kleywegt","year":"1996","unstructured":"Kleywegt GJ: Use of noncrystallographic symmetry in protein structure refinement. Acta Crystallogr D. 1996, 52 (Pt. 4): 842-857.","journal-title":"Acta Crystallogr D"},{"issue":"11","key":"6498_CR20","doi-asserted-by":"publisher","first-page":"5913","DOI":"10.1073\/pnas.95.11.5913","volume":"95","author":"M Levitt","year":"1998","unstructured":"Levitt M, Gerstein M: A unified statistical framework for sequence comparison and structure comparison. Proc Natl Acad Sci USA. 1998, 95 (11): 5913-5920. 10.1073\/pnas.95.11.5913.","journal-title":"Proc Natl Acad Sci USA"},{"issue":"3","key":"6498_CR21","doi-asserted-by":"publisher","first-page":"141","DOI":"10.1016\/0960-9822(93)90255-M","volume":"3","author":"S Subbiah","year":"1993","unstructured":"Subbiah S, Laurents DV, Levitt M: Secondary-structure matching (SSM), a new tool for fast protein structure alignment in three dimensions. Curr Biol. 1993, 3 (3): 141-148. 10.1016\/0960-9822(93)90255-M.","journal-title":"Curr Biol"},{"issue":"1","key":"6498_CR22","doi-asserted-by":"publisher","first-page":"123","DOI":"10.1006\/jmbi.1993.1489","volume":"233","author":"L Holm","year":"1993","unstructured":"Holm L, Sander C: Protein structure comparison by alignment of distance matrices. jmb. 1993, 233 (1): 123-138. 10.1006\/jmbi.1993.1489.","journal-title":"jmb"},{"issue":"9","key":"6498_CR23","doi-asserted-by":"publisher","first-page":"739","DOI":"10.1093\/protein\/11.9.739","volume":"11","author":"IN Shindyalov","year":"1998","unstructured":"Shindyalov IN, Bourne PE: Protein structure alignment by incremental combinatorial extension (CE) of the optimal path. Protein Eng. 1998, 11 (9): 739-747. 10.1093\/protein\/11.9.739.","journal-title":"Protein Eng"},{"issue":"13","key":"6498_CR24","doi-asserted-by":"publisher","first-page":"3370","DOI":"10.1093\/nar\/gkg571","volume":"31","author":"A Zemla","year":"2003","unstructured":"Zemla A: LGA: a method for finding 3D similarities in protein structures. Nucl Acids Res. 2003, 31 (13): 3370-3374. 10.1093\/nar\/gkg571.","journal-title":"Nucl Acids Res"},{"issue":"7","key":"6498_CR25","doi-asserted-by":"publisher","first-page":"2302","DOI":"10.1093\/nar\/gki524","volume":"33","author":"Y Zhang","year":"2005","unstructured":"Zhang Y, Skolnick J: TM-align: a protein structure alignment algorithm based on the TM-score. Nucl Acids Res. 2005, 33 (7): 2302-2309. 10.1093\/nar\/gki524.","journal-title":"Nucl Acids Res"},{"issue":"3","key":"6498_CR26","doi-asserted-by":"publisher","first-page":"356","DOI":"10.1002\/prot.340230309","volume":"23","author":"T Madej","year":"1995","unstructured":"Madej T, Gibrat JF, Bryant SH: Threading a database of protein cores. Proteins: Struct Funct Bioinf. 1995, 23 (3): 356-369. 10.1002\/prot.340230309.","journal-title":"Proteins: Struct Funct Bioinf"},{"issue":"3","key":"6498_CR27","doi-asserted-by":"publisher","first-page":"377","DOI":"10.1016\/S0959-440X(96)80058-3","volume":"6","author":"JF Gibrat","year":"1996","unstructured":"Gibrat JF, Madej T, Bryant SH: Suprising similarities in structure comparison. Curr Opinion Struct Biol. 1996, 6 (3): 377-385. 10.1016\/S0959-440X(96)80058-3.","journal-title":"Curr Opinion Struct Biol"},{"issue":"12.1","key":"6498_CR28","doi-asserted-by":"publisher","first-page":"2256","DOI":"10.1107\/S0907444904026460","volume":"60","author":"E Kissinel","year":"2004","unstructured":"Kissinel E, Henrick K: Secondary-structure matching (SSM), a new tool for fast protein structure alignment in three dimensions. Acta Crystallographica D Bio Crystallogr. 2004, 60 (12.1): 2256-2268.","journal-title":"Acta Crystallographica D Bio Crystallogr"},{"key":"6498_CR29","doi-asserted-by":"publisher","first-page":"3481","DOI":"10.1073\/pnas.0914097107","volume":"107","author":"I Budowski-Tal","year":"2010","unstructured":"Budowski-Tal I, Nov Y, Kolodny R: Fragbag, an accurate representation of protein structure, retrieves structural neighbors from the entire PDB quickly and accurately. Proc Natl Acad Sci USA. 2010, 107: 3481-3486. 10.1073\/pnas.0914097107.","journal-title":"Proc Natl Acad Sci USA"},{"key":"6498_CR30","doi-asserted-by":"publisher","first-page":"1235","DOI":"10.1016\/j.jmb.2005.03.037","volume":"348","author":"AE Todd","year":"2005","unstructured":"Todd AE, Marsden RL, Thornton JM, Orengo CA: Progress of structural genomics initiatives: an analysis of solved target structures. J Mol Biol. 2005, 348: 1235-1260. 10.1016\/j.jmb.2005.03.037.","journal-title":"J Mol Biol"},{"issue":"7","key":"6498_CR31","doi-asserted-by":"publisher","first-page":"1325","DOI":"10.1002\/pro.5560050711","volume":"5","author":"A Godzik","year":"1996","unstructured":"Godzik A: The structural alignment between two proteins: is there a unique answer?. Protein Sci. 1996, 5 (7): 1325-1338. 10.1002\/pro.5560050711.","journal-title":"Protein Sci"},{"issue":"5","key":"6498_CR32","doi-asserted-by":"publisher","first-page":"1307","DOI":"10.1016\/S0022-2836(03)00045-7","volume":"326","author":"A Stark","year":"2003","unstructured":"Stark A, Sunyaev S, Russell RB: A model for statistical significance of local similarities in structure. J Mol Biol. 2003, 326 (5): 1307-1316. 10.1016\/S0022-2836(03)00045-7.","journal-title":"J Mol Biol"},{"issue":"3","key":"6498_CR33","doi-asserted-by":"publisher","first-page":"773","DOI":"10.1110\/ps.03328504","volume":"13","author":"ML Sierk","year":"2004","unstructured":"Sierk ML, Pearson WR: Sensitivity and selectivity in protein structure comparison. Protein Sci. 2004, 13 (3): 773-785. 10.1110\/ps.03328504.","journal-title":"Protein Sci"},{"key":"6498_CR34","doi-asserted-by":"publisher","first-page":"3651","DOI":"10.1073\/pnas.0409772102","volume":"102","author":"J Hou","year":"2005","unstructured":"Hou J, S.-R J, Zhang C, Kim S: Global mapping of the protein structure space and application in structure-based inference of protein function. Proc Natl Acad Sci USA. 2005, 102: 3651-3656. 10.1073\/pnas.0409772102.","journal-title":"Proc Natl Acad Sci USA"},{"key":"6498_CR35","doi-asserted-by":"publisher","first-page":"75","DOI":"10.2174\/157489306775330606","volume":"1","author":"O Carugo","year":"2006","unstructured":"Carugo O: Rapid methds for comparing protein structures and scanning structure databases. Current Bioinformatics. 2006, 1: 75-83. 10.2174\/157489306775330606.","journal-title":"Current Bioinformatics"},{"issue":"12","key":"6498_CR36","doi-asserted-by":"publisher","first-page":"829","DOI":"10.1093\/protein\/13.12.829","volume":"13","author":"AC Martin","year":"2000","unstructured":"Martin AC: The ups and downs of protein topology; rapid comparison of protein structure. Protein Eng. 2000, 13 (12): 829-837. 10.1093\/protein\/13.12.829.","journal-title":"Protein Eng"},{"key":"6498_CR37","doi-asserted-by":"publisher","first-page":"44","DOI":"10.1186\/1756-0500-1-44","volume":"1","author":"S Kirilova","year":"2008","unstructured":"Kirilova S, Carugo O: Progress in the PRIDE technique for rapidly comparing protein three-dimensional structures. BMC Research Notes. 2008, 1: 44-10.1186\/1756-0500-1-44.","journal-title":"BMC Research Notes"},{"issue":"7","key":"6498_CR38","doi-asserted-by":"publisher","first-page":"1045","DOI":"10.1093\/bioinformatics\/bth036","volume":"20","author":"Z Aung","year":"2004","unstructured":"Aung Z, Tan KL: Rapid 3D protein structure database searching using information retrieval techniques. Bioinformatics. 2004, 20 (7): 1045-1052. 10.1093\/bioinformatics\/bth036.","journal-title":"Bioinformatics"},{"issue":"1","key":"6498_CR39","doi-asserted-by":"publisher","first-page":"137","DOI":"10.1002\/prot.20517","volume":"61","author":"M Carpentier","year":"2005","unstructured":"Carpentier M, Brouillet S, Pothier J: YAKUSA: a fast structural database scanning method. Proteins: Struct Funct Bioinf. 2005, 61 (1): 137-151. 10.1002\/prot.20517.","journal-title":"Proteins: Struct Funct Bioinf"},{"issue":"22","key":"6498_CR40","doi-asserted-by":"publisher","first-page":"152","DOI":"10.1093\/nar\/gkl788","volume":"34","author":"AM Lisewski","year":"2006","unstructured":"Lisewski AM, Lichtarge O: Rapid detection of similarity in protein structure and function through contact metric distances. Nucl Acids Res. 2006, 34 (22): 152-10.1093\/nar\/gkl788.","journal-title":"Nucl Acids Res"},{"key":"6498_CR41","doi-asserted-by":"publisher","first-page":"155","DOI":"10.1186\/1471-2105-11-155","volume":"11","author":"ZH Zhang","year":"2010","unstructured":"Zhang ZH, Hwee KL, Mihalek I: Reduced representation of protein structure: implications on efficiency and scope of detection of structural similarity. BMC Bioinformatics. 2010, 11: 155-10.1186\/1471-2105-11-155.","journal-title":"BMC Bioinformatics"},{"issue":"1","key":"6498_CR42","doi-asserted-by":"publisher","first-page":"119","DOI":"10.1073\/pnas.2636460100","volume":"100","author":"P Rogen","year":"2003","unstructured":"Rogen P, Fain B: Automatic classification of protein structure by using gauss integrals. Proc Natl Acad Sci USA. 2003, 100 (1): 119-124. 10.1073\/pnas.2636460100.","journal-title":"Proc Natl Acad Sci USA"},{"issue":"4","key":"6498_CR43","doi-asserted-by":"publisher","first-page":"887","DOI":"10.1006\/jmbi.2001.5250","volume":"315","author":"O Carugo","year":"2002","unstructured":"Carugo O, Pongor S: Protein fold similarity estimated by a probabilistic approach based on c(a)-c(a) distance comparison. J Mol Biol. 2002, 315 (4): 887-898. 10.1006\/jmbi.2001.5250.","journal-title":"J Mol Biol"},{"key":"6498_CR44","doi-asserted-by":"publisher","first-page":"297","DOI":"10.1016\/S0022-2836(02)00942-7","volume":"323","author":"R Kolodny","year":"2002","unstructured":"Kolodny R, Koehl P, Guibas L, Levitt M: Small libraries of protein fragments model native protein structures accurately. J Mol Biol. 2002, 323: 297-307. 10.1016\/S0022-2836(02)00942-7.","journal-title":"J Mol Biol"},{"issue":"1","key":"6498_CR45","doi-asserted-by":"publisher","first-page":"12","DOI":"10.1186\/1748-7188-5-12","volume":"5","author":"SM Salem","year":"2010","unstructured":"Salem SM, Zaki MJ, Bystroff C: Flexible non-sequential protein structure alignment. Algorithms for Molecular Biology. 2010, 5 (1): 12-10.1186\/1748-7188-5-12.","journal-title":"Algorithms for Molecular Biology"},{"issue":"2","key":"6498_CR46","doi-asserted-by":"crossref","first-page":"246","DOI":"10.1093\/bioinformatics\/btg1086","volume":"19","author":"Y Ye","year":"2003","unstructured":"Ye Y, Godzik A: Flexible stucture alignment by chaining aligned fragment pairs allowing twists. Bioinformatics. 2003, 19 (2): 246-255.","journal-title":"Bioinformatics"},{"key":"6498_CR47","doi-asserted-by":"publisher","first-page":"12301","DOI":"10.1073\/pnas.1102727108","volume":"108","author":"M Osadchy","year":"2011","unstructured":"Osadchy M, Kolodny R: Maps of protein structure space reveal a fundamental relationship between protein structure and function. Proc Natl Acad Sci USA. 2011, 108: 12301-12306. 10.1073\/pnas.1102727108.","journal-title":"Proc Natl Acad Sci USA"},{"key":"6498_CR48","first-page":"1","volume-title":"AAAI Workshop","author":"C Keasar","year":"2013","unstructured":"Keasar C, Kolodny R: Using protein fragments for searching and data-mining protein databases. AAAI Workshop. 2013, 1-6."},{"key":"6498_CR49","first-page":"536","volume":"247","author":"AG Murzin","year":"1995","unstructured":"Murzin AG, Brenner SE, Hubbard T, Chothia C: SCOP: a structural classification of proteins database for the investigation of sequences and structures. J Mol Biol. 1995, 247: 536-540.","journal-title":"J Mol Biol"},{"issue":"8","key":"6498_CR50","doi-asserted-by":"publisher","first-page":"1093","DOI":"10.1016\/S0969-2126(97)00260-8","volume":"5","author":"CA Orengo","year":"1997","unstructured":"Orengo CA, Michie AD, Jones S, Jones DT, Swindells MB, Thornton JM: CATH database: A hierarchic classification of protein domain structures. Structure. 1997, 5 (8): 1093-1108. 10.1016\/S0969-2126(97)00260-8.","journal-title":"Structure"},{"key":"6498_CR51","doi-asserted-by":"publisher","first-page":"452","DOI":"10.1093\/nar\/gkg062","volume":"31","author":"FM Pearl","year":"2003","unstructured":"Pearl FM, Bennett CF, Bray JE: The CATH database: an extended protein family resource for structural and functional genomics. Nucl Acids Res. 2003, 31: 452-455. 10.1093\/nar\/gkg062.","journal-title":"Nucl Acids Res"},{"issue":"1","key":"6498_CR52","doi-asserted-by":"publisher","first-page":"235","DOI":"10.1093\/nar\/28.1.235","volume":"28","author":"HM Berman","year":"2000","unstructured":"Berman HM, Westbrook J, Feng Z, Gilliland G, Bhat TN, Weissig H, Shindyalov IN, Bourne PE: The protein data bank. Nucl Acids Res. 2000, 28 (1): 235-242. 10.1093\/nar\/28.1.235.","journal-title":"Nucl Acids Res"},{"issue":"1","key":"6498_CR53","doi-asserted-by":"publisher","first-page":"316","DOI":"10.1093\/nar\/26.1.316","volume":"26","author":"L Holm","year":"1998","unstructured":"Holm L, Sander C: Touring protein fold space with dali\/fssp. Nucl Acids Res. 1998, 26 (1): 316-319. 10.1093\/nar\/26.1.316.","journal-title":"Nucl Acids Res"},{"key":"6498_CR54","doi-asserted-by":"publisher","first-page":"61","DOI":"10.1093\/bioinformatics\/btr249","volume":"27","author":"S Shivashankar","year":"2011","unstructured":"Shivashankar S, Srivathsan S, Ravindran B, Tendulkar AV: Multi-view methods for protein structure comparison using Latent Dirichlet Allocation. Bioinformatics. 2011, 27: 61-68. 10.1093\/bioinformatics\/btr249.","journal-title":"Bioinformatics"},{"key":"6498_CR55","volume-title":"Proceedings of the European Conference on Machine Learning and Knowledge Discovery in Databases: Part I ECML PKDD '09, pp 67-82","author":"L Alsumait","year":"2009","unstructured":"Alsumait L, Barbara D, Gentle J, Domeniconi C: Topic significance ranking of lda generative models. Proceedings of the European Conference on Machine Learning and Knowledge Discovery in Databases: Part I ECML PKDD '09, pp 67-82. 2009, Springer, Berlin, Heidelberg"},{"key":"6498_CR56","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511809071","volume-title":"Introduction to Information Retrieval","author":"CD Manning","year":"2008","unstructured":"Manning CD, Raghavan P, Schutze H: Introduction to Information Retrieval. 2008, Cambridge University Press, New York"},{"issue":"6","key":"6498_CR57","doi-asserted-by":"publisher","first-page":"656","DOI":"10.1107\/S0567739472001627","volume":"26","author":"AD McLachlan","year":"1972","unstructured":"McLachlan AD: A mathematical procedure for superimposing atomic coordinates of proteins. Acta Crystallogr A. 1972, 26 (6): 656-657. 10.1107\/S0567739472001627.","journal-title":"Acta Crystallogr A"},{"key":"6498_CR58","doi-asserted-by":"publisher","first-page":"2695","DOI":"10.1093\/bioinformatics\/btl461","volume":"22","author":"BJ Grant","year":"2006","unstructured":"Grant BJ, Rodrigues AP, ElSawy KM, McCammon JA, Caves LS: Bio3d: an R package for the comparative analysis of protein structures. Bioinformatics. 2006, 22: 2695-2696. 10.1093\/bioinformatics\/btl461.","journal-title":"Bioinformatics"},{"key":"6498_CR59","first-page":"993","volume":"3","author":"DM Blei","year":"2003","unstructured":"Blei DM: Latent Dirichlet Allocation. J Mach Learn Res. 2003, 3: 993-1022.","journal-title":"J Mach Learn Res"},{"key":"6498_CR60","volume-title":"Latent Semantic Analysis: A Road to Meaning","author":"M Steyvers","year":"2006","unstructured":"Steyvers M, Griffiths T: Probabilistic topic models. Latent Semantic Analysis: A Road to Meaning. Edited by: Landauer, T., Mcnamara, D., Dennis, S., Kintsch, W. 2006, Laurence Erlbaum, Hillsdate, NJ, [http:\/\/cocosci.berkeley.edu\/tom\/papers\/SteyversGriffiths.pdf]"},{"key":"6498_CR61","first-page":"340","volume":"41","author":"S Kullback","year":"1987","unstructured":"Kullback S: Letter to the editor: The kullback-leibler distance. The American Statistician. 1987, 41: 340-341.","journal-title":"The American Statistician"},{"key":"6498_CR62","volume-title":"Technical report","author":"G Heinrich","year":"2004","unstructured":"Heinrich G: Parameter estimation for text analysis. Technical report. 2004, University of Leipzig, Germany"},{"key":"6498_CR63","doi-asserted-by":"publisher","DOI":"10.1002\/9781118165881","volume-title":"Nonparametric Statistics for Non-statisticians: A Step-by-step Approach","author":"GW Corder","year":"2009","unstructured":"Corder GW, Foreman DI: Nonparametric Statistics for Non-statisticians: A Step-by-step Approach. 2009, Wiley, New York"},{"key":"6498_CR64","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4757-2440-0","volume-title":"The Nature of Statistical Learning Theory","author":"VN Vapnik","year":"1995","unstructured":"Vapnik VN: The Nature of Statistical Learning Theory. 1995, Springer, New York, NY, USA"},{"issue":"1","key":"6498_CR65","doi-asserted-by":"publisher","first-page":"10","DOI":"10.1145\/1656274.1656278","volume":"11","author":"M Hall","year":"2009","unstructured":"Hall M, Frank E, Holmes G, Pfahringer B, Reutemann P, Witten IH: The weka data mining software: an update. SIGKDD Explor. Newsl. 2009, 11 (1): 10-18. 10.1145\/1656274.1656278.","journal-title":"Newsl"},{"issue":"1","key":"6498_CR66","doi-asserted-by":"publisher","first-page":"25","DOI":"10.1016\/S0097-8485(96)80004-0","volume":"20","author":"M Gribskov","year":"1996","unstructured":"Gribskov M, Robinson NL: Use of receiver operating characteristic (ROC) analysis to evaluate sequence matching. Comput Chem. 1996, 20 (1): 25-33. 10.1016\/S0097-8485(96)80004-0.","journal-title":"Comput Chem"},{"issue":"1","key":"6498_CR67","doi-asserted-by":"publisher","first-page":"33","DOI":"10.1016\/0263-7855(96)00018-5","volume":"14","author":"W Humphrey","year":"1996","unstructured":"Humphrey W, Dalke A, Schulten K: VMD - Visual Molecular Dynamics. J Mol Graph Model. 1996, 14 (1): 33-38. 10.1016\/0263-7855(96)00018-5. [http:\/\/www.ks.uiuc.edu\/Research\/vmd\/]","journal-title":"J Mol Graph Model"}],"container-title":["BMC Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/1471-2105-15-S8-S4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,7,15]],"date-time":"2023-07-15T06:34:59Z","timestamp":1689402899000},"score":1,"resource":{"primary":{"URL":"https:\/\/bmcbioinformatics.biomedcentral.com\/articles\/10.1186\/1471-2105-15-S8-S4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014,7]]},"references-count":67,"journal-issue":{"issue":"S8","published-print":{"date-parts":[[2014,7]]}},"alternative-id":["6498"],"URL":"https:\/\/doi.org\/10.1186\/1471-2105-15-s8-s4","relation":{},"ISSN":["1471-2105"],"issn-type":[{"value":"1471-2105","type":"electronic"}],"subject":[],"published":{"date-parts":[[2014,7]]},"assertion":[{"value":"14 July 2014","order":1,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"S4"}}