{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T10:53:21Z","timestamp":1740135201218,"version":"3.37.3"},"reference-count":48,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2018,3,27]],"date-time":"2018-03-27T00:00:00Z","timestamp":1522108800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"DOI":"10.13039\/501100001665","name":"Agence Nationale de la Recherche","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001665","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["BMC Bioinformatics"],"published-print":{"date-parts":[[2018,12]]},"DOI":"10.1186\/s12859-018-2054-0","type":"journal-article","created":{"date-parts":[[2018,4,3]],"date-time":"2018-04-03T22:18:59Z","timestamp":1522793939000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":6,"title":["A method combining a random forest-based technique with the modeling of linkage disequilibrium through latent variables, to run multilocus genome-wide association studies"],"prefix":"10.1186","volume":"19","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-6358-9420","authenticated-orcid":false,"given":"Christine","family":"Sinoquet","sequence":"first","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,3,27]]},"reference":[{"key":"2054_CR1","doi-asserted-by":"publisher","unstructured":"Balding DJ. A tutorial on statistical methods for population association studies. Nat Genet. 2006; 7:781\u201390. https:\/\/doi.org\/10.1038\/nrg1916 .","DOI":"10.1038\/nrg1916"},{"key":"2054_CR2","doi-asserted-by":"publisher","first-page":"85","DOI":"10.1007\/978-1-59745-389-9_7","volume":"376","author":"A DeWan","year":"2007","unstructured":"DeWan A, Klein RJ, Hoh J. Linkage disequilibrium mapping for complex disease genes. Methods Mol Biol. 2007; 376:85\u2013107.","journal-title":"Methods Mol Biol"},{"issue":"5547","key":"2054_CR3","doi-asserted-by":"publisher","first-page":"1719","DOI":"10.1126\/science.1065573","volume":"294","author":"N Patil","year":"2001","unstructured":"Patil N, Berno AJ, Hinds DA, Barrett WA, Doshi JM, Hacker CR, et al.Blocks of limited haplotype diversity revealed by high-resolution scanning of human chromosome 21. Science. 2001; 294(5547):1719\u201323.","journal-title":"Science"},{"key":"2054_CR4","doi-asserted-by":"crossref","unstructured":"Liu N, Zhang K, Zhao H. Haplotype-Association Analysis In: Rao DC, Charles Gu C, editors. Genetic Dissection of Complex Traits: 2008. p. 335\u2013405.","DOI":"10.1016\/S0065-2660(07)00414-2"},{"key":"2054_CR5","doi-asserted-by":"publisher","first-page":"291","DOI":"10.1038\/sj.ejhg.5200619","volume":"9","author":"J Akey","year":"2001","unstructured":"Akey J, Jin L, Xiong M. Haplotypes vs single marker linkage disequilibrium tests: what do we gain?Eur J Hum Genet. 2001; 9:291\u2013300.","journal-title":"Eur J Hum Genet"},{"issue":"6","key":"2054_CR6","doi-asserted-by":"publisher","first-page":"675","DOI":"10.1007\/BF02945456","volume":"18","author":"P Bonizzoni","year":"2003","unstructured":"Bonizzoni P, Della Vedova G, Dondi R, Li J. The haplotyping problem: an overview of computational models and solutions. J Comput Sci Technol. 2003; 18(6):675\u201388.","journal-title":"J Comput Sci Technol"},{"key":"2054_CR7","doi-asserted-by":"publisher","first-page":"703","DOI":"10.1038\/nrg3054","volume":"12","author":"SR Browning","year":"2011","unstructured":"Browning SR, Browning BL. Haplotype phasing: existing methods and new developments. Nat Rev Genet. 2011; 12:703\u201314.","journal-title":"Nat Rev Genet"},{"key":"2054_CR8","doi-asserted-by":"publisher","first-page":"365","DOI":"10.1002\/gepi.20216","volume":"31","author":"BL Browning","year":"2007","unstructured":"Browning BL, Browning SR. Efficient multilocus association testing for whole genome association studies using localized haplotype clustering. Genet Epidemiol. 2007; 31:365\u201375.","journal-title":"Genet Epidemiol"},{"key":"2054_CR9","doi-asserted-by":"publisher","unstructured":"He Y, Li C, Amos CI, Xiong M, Ling H, Jin L. Accelerating haplotype-based genome-wide association study using perfect phylogeny and phase-known reference data. PLoS ONE. 2011; 6(7):e22097. https:\/\/doi.org\/10.1371\/journal.pone.0022097 .","DOI":"10.1371\/journal.pone.0022097"},{"issue":"1","key":"2054_CR10","doi-asserted-by":"publisher","first-page":"207","DOI":"10.1109\/TCBB.2013.6","volume":"10","author":"X Yang","year":"2013","unstructured":"Yang X, Yang Q, Zhao H, Yu W. HapBoost: a fast approach to boosting haplotype association analyses in genome-wide association studies. IEEE\/ACM Trans Comput Biol Bioinform. 2013; 10(1):207\u201312.","journal-title":"IEEE\/ACM Trans Comput Biol Bioinform"},{"key":"2054_CR11","unstructured":"Harb N, Saghir MAR, Dawy Z, Valderrama C. FPGA based accelerator for bioinformatics haplotype inference application. In: Proc. International Conference on Bioinformatics & Computational Biology BIOCOMP (WORLDCOMP). Las Vegas, Nevada, USA: 2012;212:166."},{"issue":"4","key":"2054_CR12","doi-asserted-by":"publisher","first-page":"629","DOI":"10.1086\/502802","volume":"78","author":"P Scheet","year":"2006","unstructured":"Scheet P, Stephens M. A fast and flexible method for large-scale population genotype data: applications to inferring missing genotypes and haplotypic phase. Am J Hum Genet. 2006; 78(4):629\u201344.","journal-title":"Am J Hum Genet"},{"key":"2054_CR13","doi-asserted-by":"publisher","first-page":"S51","DOI":"10.1002\/gepi.20473","volume":"33 Suppl 1","author":"S Szymczak","year":"2009","unstructured":"Szymczak S, Biernacka JM, Cordell HJ, Gonz\u00e1lez-Recio O, K\u00f6nig IR, Zhang H, et al.Machine learning in genome-wide association studies. Genet Epidemiol. 2009; 33 Suppl 1:S51\u20137.","journal-title":"Genet Epidemiol"},{"key":"2054_CR14","doi-asserted-by":"publisher","unstructured":"Okser S, Pahikkala T, Airola A, Salakoski T, Ripatti S, Aittokallio T. Regularized machine learning in the genetic prediction of complex traits. PLoS Genet. 2014; 10(11):e1004754. https:\/\/doi.org\/10.1371\/journal.pgen.1004754 .","DOI":"10.1371\/journal.pgen.1004754"},{"key":"2054_CR15","doi-asserted-by":"publisher","unstructured":"Waldmann P, M\u00e9sz\u00e0ros G, Gredler B, Fuerst C, S\u00f6lkner J. Evaluation of the lasso and the elastic net in genome-wide association studies. Front Genet. 2013; 4(4):270. https:\/\/doi.org\/10.3389\/fgene.2013.00270 .","DOI":"10.3389\/fgene.2013.00270"},{"key":"2054_CR16","doi-asserted-by":"publisher","unstructured":"Austin E, Pan W, Shen X. Penalized regression and risk prediction in genome-wide association studies. Stat Anal Data Min. 2013; 6(4). https:\/\/doi.org\/10.1002\/sam.11183 .","DOI":"10.1002\/sam.11183"},{"key":"2054_CR17","doi-asserted-by":"publisher","unstructured":"Roshan U, Chikkagoudar S, Wei Z, Wang K, Hakonarson H. Ranking causal variants and associated regions in genome-wide association studies by the support vector machine and random forest. Nucleic Acids Res. 2011:1\u20138. https:\/\/doi.org\/10.1093\/nar\/gkr064 .","DOI":"10.1093\/nar\/gkr064"},{"key":"2054_CR18","doi-asserted-by":"publisher","unstructured":"Motsinger-Reif AA, Ritchie MD. Neural networks for genetic epidemiology: past, present, and future. BioData Min. 2008; 1(3). https:\/\/doi.org\/10.1186\/1756--0381-1-3 .","DOI":"10.1186\/1756--0381-1-3"},{"issue":"6","key":"2054_CR19","doi-asserted-by":"publisher","first-page":"1088","DOI":"10.1086\/421249","volume":"74","author":"A Thomas","year":"2004","unstructured":"Thomas A, Camp NJ. Graphical modeling of the joint distribution of alleles at associated loci. Am J Hum Genet. 2004; 74(6):1088\u2013101.","journal-title":"Am J Hum Genet"},{"issue":"1","key":"2054_CR20","doi-asserted-by":"publisher","first-page":"100","DOI":"10.1086\/505313","volume":"79","author":"CJ Verzilli","year":"2006","unstructured":"Verzilli CJ, Stallard N, Whittaker JC. Bayesian graphical models for genomewide association studies. Am J Hum Genet. 2006; 79(1):100\u201312.","journal-title":"Am J Hum Genet"},{"key":"2054_CR21","doi-asserted-by":"publisher","unstructured":"Touw WG, Bayjanov JR, Overmars L, Backus L, Boekhorst J, Wels M, et al.Data mining in the Life Sciences with Random Forest: a walk in the park or lost in the jungle?. Brief Bioinform. 2013; 14(3):315\u201326. https:\/\/doi.org\/10.1093\/bib\/bbs034 .","DOI":"10.1093\/bib\/bbs034"},{"issue":"1","key":"2054_CR22","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1023\/A:1010933404324","volume":"45","author":"L Breiman","year":"2001","unstructured":"Breiman L. Random forests. Mach Learn. 2001; 45(1):5\u201332.","journal-title":"Mach Learn"},{"key":"2054_CR23","doi-asserted-by":"publisher","unstructured":"Goldstein BA, Hubbard AE, Cutler A, Barcellos LF. An application of Random Forests to a genome-wide association dataset: methodological considerations & new findings. BMC Genet. 2010; 11:49. https:\/\/doi.org\/10.1186\/1471-2156-11-49 .","DOI":"10.1186\/1471-2156-11-49"},{"key":"2054_CR24","doi-asserted-by":"publisher","first-page":"S5","DOI":"10.1186\/1471-2164-16-S2-S5","volume":"16 Suppl 2","author":"T-T Nguyen","year":"2015","unstructured":"Nguyen T-T, Huang JZ, Wu Q, Nguyen TT, Junjie Li M. Genome-wide association data classification and SNPs selection using two-stage quality-based Random Forests. BMC Genomics. 2015; 16 Suppl 2:S5.","journal-title":"BMC Genomics"},{"key":"2054_CR25","unstructured":"Kawaguchi A. Variable ranking by random forests model for genome-wide association study. In: Proc International MultiConference of Engineers and Computer Scientists. Hong Kong: 2012. p. 16."},{"key":"2054_CR26","doi-asserted-by":"publisher","unstructured":"Botta V, Louppe G, Geurts P, Wehenkel L. Exploiting SNP correlations within random forest for genome-wide association studies. PLoS ONE. 2014; 9(4):e93379. https:\/\/doi.org\/10.1371\/journal.pone.0093379 .","DOI":"10.1371\/journal.pone.0093379"},{"key":"2054_CR27","doi-asserted-by":"crossref","unstructured":"Sinoquet C, Mourad R. Modeling linkage disequilibrium and performing association studies through probabilistic graphical models: a visiting tour of recent advances In: Sinoquet C, Mourad R, editors. Probabilistic graphical models for genetics, genomics, and postgenomics. Oxford University Press: 2014. p. 217\u201346.","DOI":"10.1093\/acprof:oso\/9780198709022.003.0009"},{"key":"2054_CR28","doi-asserted-by":"publisher","unstructured":"Mourad R, Sinoquet C, Leray P. Probabilistic graphical models for genetic association studies. Brief Bioinform. 2012; 13(1):20\u201333. https:\/\/doi.org\/10.1093\/bib\/bbr015 .","DOI":"10.1093\/bib\/bbr015"},{"key":"2054_CR29","doi-asserted-by":"publisher","unstructured":"Thomas A. A method and program for estimating graphical models forfig1 linkage disequilibrium that scale linearly with the number of loci, and their application to gene drop simulation. Bioinformatics. 2009; 25(10):1287\u201392. https:\/\/doi.org\/10.1093\/bioinformatics\/btp146 .","DOI":"10.1093\/bioinformatics\/btp146"},{"key":"2054_CR30","doi-asserted-by":"publisher","unstructured":"Abel HJ, Thomas A. Accuracy and computational efficiency of a graphical modeling approach to linkage disequilibrium estimation. Stat Appl Genet Mol Biol. 2011; 10(1):5. https:\/\/doi.org\/10.2202\/1544--6115.1615 .","DOI":"10.2202\/1544--6115.1615"},{"key":"2054_CR31","doi-asserted-by":"publisher","unstructured":"Edwards D. Modelling and visualizing fine-scale linkage disequilibrium structure. BMC Bioinformatics. 2013; 14:179. https:\/\/doi.org\/10.1186\/1471-2105-14-179 .","DOI":"10.1186\/1471-2105-14-179"},{"key":"2054_CR32","doi-asserted-by":"publisher","unstructured":"Mourad R, Sinoquet C, Leray P. A hierarchical Bayesian network approach for linkage disequilibrium modeling and data-dimensionality reduction prior to genome-wide association studies. BMC Bioinformatics. 2011; 12(1):16. https:\/\/doi.org\/10.1186\/1471-2105-12-16 .","DOI":"10.1186\/1471-2105-12-16"},{"key":"2054_CR33","doi-asserted-by":"crossref","unstructured":"Breiman L. Bagging predictors. Machine Learning. 1996; 24(2):123\u201340.","DOI":"10.1007\/BF00058655"},{"issue":"8","key":"2054_CR34","doi-asserted-by":"publisher","first-page":"832","DOI":"10.1109\/34.709601","volume":"20","author":"T Ho","year":"1998","unstructured":"Ho T. The Random subspace method for constructing decision forests. IEEE Trans Pattern Anal Mach. Intell. 1998; 20(8):832\u201344.","journal-title":"IEEE Trans Pattern Anal Mach. Intell"},{"issue":"2","key":"2054_CR35","doi-asserted-by":"publisher","first-page":"139","DOI":"10.1023\/A:1007607513941","volume":"40","author":"TG Dietterich","year":"2000","unstructured":"Dietterich TG. An experimental comparison of three methods for constructing ensembles of decision trees: Bagging, Boosting, and Randomization. Mach Learn. 2000; 40(2):139\u201357.","journal-title":"Mach Learn"},{"key":"2054_CR36","volume-title":"A walk into random forests. Adaptation and application to Genome-Wide Association Studies","author":"V Botta","year":"2013","unstructured":"Botta V. A walk into random forests. Adaptation and application to Genome-Wide Association Studies. Belgium: PhD Thesis, University of Li\u00e8ge.2013."},{"key":"2054_CR37","unstructured":"Zhi-Hua Z. Ensemble Methods: Foundations and Algorithms.Chapman and Hall\/CRC; 2012."},{"key":"2054_CR38","doi-asserted-by":"crossref","unstructured":"Geurts P, Ernst D, Wehenkel L. Extremely randomized trees. Mach Learn. 2006; 36:3\u201342.","DOI":"10.1007\/s10994-006-6226-1"},{"key":"2054_CR39","first-page":"697","volume":"5","author":"NL Zhang","year":"2004","unstructured":"Zhang NL. Hierarchical latent class models for cluster analysis. J Mach Learn Res. 2004; 5:697\u2013723.","journal-title":"J Mach Learn Res"},{"key":"2054_CR40","doi-asserted-by":"crossref","first-page":"157","DOI":"10.1613\/jair.3879","volume":"47","author":"R Mourad","year":"2013","unstructured":"Mourad R, Sinoquet C, Zhang NL, Liu T, Leray P. A survey on latent tree models and applications. J Artif Intell Res. 2013; 47:157\u2013203.","journal-title":"J Artif Intell Res"},{"key":"2054_CR41","doi-asserted-by":"crossref","unstructured":"Spencer CC, Su Z, Donnelly P, Marchini J. Designing genome-wide association studies: sample size, power, imputation, and the choice of genotyping chip. PLoS Genet. 2009;:5:e1000477+.","DOI":"10.1371\/journal.pgen.1000477"},{"key":"2054_CR42","doi-asserted-by":"crossref","unstructured":"The Wellcome Trust Case Control Consortium. Genome-wide association study of 14,000 cases of seven common diseases and 3000 shared controls. Nature. 2007; 447:661\u201378.","DOI":"10.1038\/nature05911"},{"key":"2054_CR43","doi-asserted-by":"crossref","unstructured":"Phan D-T, Leray P, Sinoquet C. Modeling genetical data with forests of latent trees for applications in association genetics at a large scale. Which clustering should be chosen? In: Proc. International Conference on Bioinformatics Models, Methods and Algorithms, Bioinformatics2015. Portugal, Lisbon: 2015. p. 5\u201316.","DOI":"10.5220\/0005179800050016"},{"key":"2054_CR44","doi-asserted-by":"crossref","unstructured":"Mekhnacha K, Ahuactzin JM, Bessi\u00e8re P, Mazer E, Smail L. Exact and approximate inference in ProBT. - Revue d\u2019Intelligence Artificielle. 2007; 21(3):295\u2013332.","DOI":"10.3166\/ria.21.295-332"},{"key":"2054_CR45","doi-asserted-by":"crossref","unstructured":"Bessi\u00e8re P, Mazer E, Ahuactzin J-M, Mekhnacha K. Bayesian Programming.Chapman and Hall\/CRC; 2013.","DOI":"10.1201\/b16111"},{"key":"2054_CR46","unstructured":"Ester M, Kriegel H-P, Sander J, Xu X. A density-based algorithm for discovering clusters in large spatial databases with noise. In: Proc. International Conference on Knowledge Discovery and Data mining.1996. p. 226\u201331."},{"key":"2054_CR47","unstructured":"Tan P-N, Steinbach M, Kumar V. Cluster analysis: basic concepts and algorithms. In: Tan P-N, Steinbach M, Kumar V. Introduction to Data Mining.2005. p. 125\u201346."},{"key":"2054_CR48","doi-asserted-by":"publisher","first-page":"29","DOI":"10.1148\/radiology.143.1.7063747","volume":"143","author":"JA Hanley","year":"1982","unstructured":"Hanley JA, McNeil BJ. The meaning and use of the area under a receiver operating characteristic (ROC) curve. Radiology. 1982; 143:29\u201336.","journal-title":"Radiology"}],"container-title":["BMC Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s12859-018-2054-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/s12859-018-2054-0\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s12859-018-2054-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,10,13]],"date-time":"2019-10-13T21:21:15Z","timestamp":1571001675000},"score":1,"resource":{"primary":{"URL":"https:\/\/bmcbioinformatics.biomedcentral.com\/articles\/10.1186\/s12859-018-2054-0"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,3,27]]},"references-count":48,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2018,12]]}},"alternative-id":["2054"],"URL":"https:\/\/doi.org\/10.1186\/s12859-018-2054-0","relation":{},"ISSN":["1471-2105"],"issn-type":[{"type":"electronic","value":"1471-2105"}],"subject":[],"published":{"date-parts":[[2018,3,27]]},"assertion":[{"value":"10 December 2016","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"9 February 2018","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 March 2018","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"Not applicable.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval and consent to participate"}},{"value":"Not applicable.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}},{"value":"The author declares that she has no competing interests.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}},{"value":"Springer Nature remains neutral with regard to jurisdictional claims in published maps and institutional affiliations.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Publisher\u2019s Note"}}],"article-number":"106"}}