{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,16]],"date-time":"2026-06-16T14:35:35Z","timestamp":1781620535705,"version":"3.54.5"},"reference-count":20,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2015,11,6]],"date-time":"2015-11-06T00:00:00Z","timestamp":1446768000000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0\/"},{"start":{"date-parts":[[2015,11,6]],"date-time":"2015-11-06T00:00:00Z","timestamp":1446768000000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"name":"Lieber Inst. for Brain Development"},{"DOI":"10.13039\/100000002","name":"National Institutes of Health","doi-asserted-by":"publisher","award":["GM105705-01"],"award-info":[{"award-number":["GM105705-01"]}],"id":[{"id":"10.13039\/100000002","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["BMC Bioinformatics"],"published-print":{"date-parts":[[2015,12]]},"DOI":"10.1186\/s12859-015-0808-5","type":"journal-article","created":{"date-parts":[[2015,11,6]],"date-time":"2015-11-06T12:57:27Z","timestamp":1446814647000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":60,"title":["Practical impacts of genomic data \u201ccleaning\u201d on biological discovery using surrogate variable analysis"],"prefix":"10.1186","volume":"16","author":[{"given":"Andrew E.","family":"Jaffe","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Thomas","family":"Hyde","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Joel","family":"Kleinman","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Daniel R.","family":"Weinbergern","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Joshua G.","family":"Chenoweth","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Ronald D.","family":"McKay","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jeffrey T.","family":"Leek","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Carlo","family":"Colantuoni","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2015,11,6]]},"reference":[{"issue":"2","key":"808_CR1","doi-asserted-by":"publisher","first-page":"185","DOI":"10.1093\/bioinformatics\/19.2.185","volume":"19","author":"BM Bolstad","year":"2003","unstructured":"Bolstad BM, Irizarry RA, Astrand M, Speed TP. A comparison of normalization methods for high density oligonucleotide array data based on variance and bias. Bioinformatics. 2003;19(2):185\u201393.","journal-title":"Bioinformatics"},{"issue":"2","key":"808_CR2","doi-asserted-by":"publisher","first-page":"249","DOI":"10.1093\/biostatistics\/4.2.249","volume":"4","author":"RA Irizarry","year":"2003","unstructured":"Irizarry RA, Hobbs B, Collin F, Beazer-Barclay YD, Antonellis KJ, Scherf U, et al. Exploration, normalization, and summaries of high density oligonucleotide array probe level data. Biostatistics. 2003;4(2):249\u201364.","journal-title":"Biostatistics"},{"key":"808_CR3","doi-asserted-by":"publisher","first-page":"733","DOI":"10.1038\/nrg2825","volume":"11","author":"JT Leek","year":"2010","unstructured":"Leek JT, Scharpf RB, Bravo HC, Simcha D, Langmead B, Johnson WE, et al. Tackling the widespread and critical impact of batch effects in high-throughput data. Nat Rev Genet. 2010;11:733\u20139.","journal-title":"Nat Rev Genet"},{"key":"808_CR4","doi-asserted-by":"publisher","first-page":"118","DOI":"10.1093\/biostatistics\/kxj037","volume":"8","author":"WE Johnson","year":"2007","unstructured":"Johnson WE, Li C, Rabinovic A. Adjusting batch effects in microarray expression data using empirical Bayes methods. Biostatistics. 2007;8:118\u201327.","journal-title":"Biostatistics"},{"key":"808_CR5","doi-asserted-by":"publisher","first-page":"1724","DOI":"10.1371\/journal.pgen.0030161","volume":"3","author":"JT Leek","year":"2007","unstructured":"Leek JT, Storey JD. Capturing heterogeneity in gene expression studies by surrogate variable analysis. PLoS Genet. 2007;3:1724\u201335.","journal-title":"PLoS Genet"},{"issue":"3","key":"808_CR6","doi-asserted-by":"publisher","first-page":"539","DOI":"10.1093\/biostatistics\/kxr034","volume":"13","author":"JA Gagnon-Bartsch","year":"2012","unstructured":"Gagnon-Bartsch JA, Speed TP. Using control genes to correct for unwanted variation in microarray data. Biostatistics. 2012;13(3):539\u201352.","journal-title":"Biostatistics"},{"issue":"2","key":"808_CR7","doi-asserted-by":"publisher","first-page":"195","DOI":"10.1093\/biostatistics\/kxr055","volume":"13","author":"CG Lambert","year":"2012","unstructured":"Lambert CG, Black LJ. Learning from our GWAS mistakes: from experimental design to scientific method. Biostatistics. 2012;13(2):195\u2013203.","journal-title":"Biostatistics"},{"issue":"6","key":"808_CR8","doi-asserted-by":"publisher","first-page":"882","DOI":"10.1093\/bioinformatics\/bts034","volume":"28","author":"JT Leek","year":"2012","unstructured":"Leek JT, Johnson WE, Parker HS, Jaffe AE, Storey JD. The sva package for removing batch effects and other unwanted variation in high-throughput experiments. Bioinformatics. 2012;28(6):882\u20133.","journal-title":"Bioinformatics"},{"issue":"1","key":"808_CR9","doi-asserted-by":"publisher","first-page":"57","DOI":"10.1016\/j.scr.2012.09.002","volume":"10","author":"BS Mallon","year":"2012","unstructured":"Mallon BS, Chenoweth JG, Johnson KR, Hamilton RS, Tesar PJ, Yavatkar AS, et al. StemCellDB: the human pluripotent stem cell database at the national institutes of health. Stem Cell Res. 2012;10(1):57\u201366.","journal-title":"Stem Cell Res"},{"key":"808_CR10","doi-asserted-by":"publisher","first-page":"397","DOI":"10.1007\/0-387-29362-0_23","volume-title":"Bioinformatics and computational biology solutions using r and bioconductor","author":"GK Smyth","year":"2005","unstructured":"Smyth GK. Limma: linear models for microarray data. In: Gentleman R, Carey V, Dudoit S, Irizarry R, Huber W, editors. Bioinformatics and computational biology solutions using r and bioconductor. New York: Springer; 2005. p. 397\u2013420."},{"issue":"1","key":"808_CR11","doi-asserted-by":"publisher","first-page":"166","DOI":"10.1093\/biostatistics\/kxr013","volume":"13","author":"AE Jaffe","year":"2012","unstructured":"Jaffe AE, Feinberg AP, Irizarry RA, Leek JT. Significance analysis and statistical dissection of variably methylated regions. Biostatistics. 2012;13(1):166\u201378.","journal-title":"Biostatistics"},{"issue":"1","key":"808_CR12","doi-asserted-by":"publisher","first-page":"200","DOI":"10.1093\/ije\/dyr238","volume":"41","author":"AE Jaffe","year":"2012","unstructured":"Jaffe AE, Murakami P, Lee H, Leek JT, Fallin MD, Feinberg AP, et al. Bump hunting to identify differentially methylated regions in epigenetic epidemiology studies. Int J Epidemiol. 2012;41(1):200\u20139.","journal-title":"Int J Epidemiol"},{"issue":"8","key":"808_CR13","doi-asserted-by":"publisher","first-page":"690","DOI":"10.1002\/dneu.20895","volume":"71","author":"PA Georgala","year":"2011","unstructured":"Georgala PA, Carr CB, Price DJ. The role of Pax6 in forebrain development. Dev Neurobiol. 2011;71(8):690\u2013709.","journal-title":"Dev Neurobiol"},{"issue":"3","key":"808_CR14","doi-asserted-by":"publisher","first-page":"247","DOI":"10.1016\/S1383-5742(00)00050-8","volume":"463","author":"S Landi","year":"2000","unstructured":"Landi S. Mammalian class theta GST and differential susceptibility to carcinogens: a review. Mutat Res. 2000;463(3):247\u201383.","journal-title":"Mutat Res"},{"issue":"5","key":"808_CR15","doi-asserted-by":"publisher","first-page":"e1000472","DOI":"10.1371\/journal.pgen.1000472","volume":"5","author":"Y Zhao","year":"2009","unstructured":"Zhao Y, Marotta M, Eichler EE, Eng C, Tanaka H. Linkage disequilibrium between two high-frequency deletion polymorphisms: implications for association studies involving the glutathione-S transferase (GST) genes. PLoS Genet. 2009;5(5):e1000472.","journal-title":"PLoS Genet"},{"issue":"7370","key":"808_CR16","doi-asserted-by":"publisher","first-page":"519","DOI":"10.1038\/nature10524","volume":"478","author":"C Colantuoni","year":"2011","unstructured":"Colantuoni C, Lipska BK, Ye T, Hyde TM, Tao R, Leek JT, et al. Temporal dynamics and genetic control of transcription in the human prefrontal cortex. Nature. 2011;478(7370):519\u201323.","journal-title":"Nature"},{"issue":"7","key":"808_CR17","doi-asserted-by":"publisher","first-page":"362","DOI":"10.1016\/S0168-9525(03)00140-9","volume":"19","author":"E Eisenberg","year":"2003","unstructured":"Eisenberg E, Levanon EY. Human housekeeping genes are compact. Trends Genet. 2003;19(7):362\u20135.","journal-title":"Trends Genet"},{"issue":"9","key":"808_CR18","doi-asserted-by":"publisher","first-page":"896","DOI":"10.1038\/nbt.2931","volume":"32","author":"D Risso","year":"2014","unstructured":"Risso D, Ngai J, Speed TP, Dudoit S. Normalization of RNA-seq data using factor analysis of control genes or samples. Nat Biotechnol. 2014;32(9):896\u2013902.","journal-title":"Nat Biotechnol"},{"issue":"16","key":"808_CR19","doi-asserted-by":"publisher","first-page":"7664","DOI":"10.1093\/nar\/gkv736","volume":"43","author":"L Peixoto","year":"2015","unstructured":"Peixoto L, Risso D, Poplawski SG, Wimmer ME, Speed TP, Wood MA, et al. How data analysis affects power, reproducibility and biological insight of RNA-seq studies in complex datasets. Nucleic Acids Res. 2015;43(16):7664\u201374.","journal-title":"Nucleic Acids Res"},{"key":"808_CR20","doi-asserted-by":"publisher","first-page":"e15","DOI":"10.1093\/nar\/30.4.e15","volume":"30","author":"YH Yang","year":"2002","unstructured":"Yang YH, Dudoit S, Luu P, Lin DM, Peng V, Ngai J, et al. Normalization for cDNA microarray data: a robust composite method addressing single and multiple slide systematic variation. Nucleic Acids Res. 2002;30:e15.","journal-title":"Nucleic Acids Res"}],"updated-by":[{"DOI":"10.1186\/s12859-016-1152-0","type":"erratum","label":"Erratum","source":"publisher","updated":{"date-parts":[[2016,8,10]],"date-time":"2016-08-10T00:00:00Z","timestamp":1470787200000}}],"container-title":["BMC Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s12859-015-0808-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/s12859-015-0808-5\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s12859-015-0808-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,5,14]],"date-time":"2020-05-14T10:47:01Z","timestamp":1589453221000},"score":1,"resource":{"primary":{"URL":"https:\/\/bmcbioinformatics.biomedcentral.com\/articles\/10.1186\/s12859-015-0808-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015,11,6]]},"references-count":20,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2015,12]]}},"alternative-id":["808"],"URL":"https:\/\/doi.org\/10.1186\/s12859-015-0808-5","relation":{"erratum":[{"id-type":"doi","id":"10.1186\/s12859-016-1152-0","asserted-by":"object"}]},"ISSN":["1471-2105"],"issn-type":[{"value":"1471-2105","type":"electronic"}],"subject":[],"published":{"date-parts":[[2015,11,6]]},"assertion":[{"value":"29 April 2015","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"30 October 2015","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"6 November 2015","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"372"}}