{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,26]],"date-time":"2026-02-26T20:33:43Z","timestamp":1772138023110,"version":"3.50.1"},"reference-count":56,"publisher":"Oxford University Press (OUP)","issue":"3","license":[{"start":{"date-parts":[[2024,5,7]],"date-time":"2024-05-07T00:00:00Z","timestamp":1715040000000},"content-version":"vor","delay-in-days":41,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"DOI":"10.13039\/100000062","name":"National Institute of Diabetes and Digestive and Kidney Diseases","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100000062","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000054","name":"National Cancer Institute","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100000054","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000057","name":"National Institute of General Medicine","doi-asserted-by":"crossref","id":[{"id":"10.13039\/100000057","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/100000002","name":"National Institutes of Health","doi-asserted-by":"publisher","award":["U54DK107977"],"award-info":[{"award-number":["U54DK107977"]}],"id":[{"id":"10.13039\/100000002","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000002","name":"National Institutes of Health","doi-asserted-by":"publisher","award":["U24CA180996"],"award-info":[{"award-number":["U24CA180996"]}],"id":[{"id":"10.13039\/100000002","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000002","name":"National Institutes of Health","doi-asserted-by":"publisher","award":["R01GM121459"],"award-info":[{"award-number":["R01GM121459"]}],"id":[{"id":"10.13039\/100000002","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000002","name":"National Institutes of Health","doi-asserted-by":"publisher","award":["R35HG011922"],"award-info":[{"award-number":["R35HG011922"]}],"id":[{"id":"10.13039\/100000002","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000002","name":"National Institutes of Health","doi-asserted-by":"publisher","award":["UM1HG011585"],"award-info":[{"award-number":["UM1HG011585"]}],"id":[{"id":"10.13039\/100000002","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000002","name":"National Institutes of Health","doi-asserted-by":"publisher","award":["R35GM149323"],"award-info":[{"award-number":["R35GM149323"]}],"id":[{"id":"10.13039\/100000002","id-type":"DOI","asserted-by":"publisher"}]},{"name":"San Diego Institutional Research and Academic Career Development Award"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,3,27]]},"abstract":"<jats:title>Abstract<\/jats:title>\n                  <jats:p>Hi-C data are commonly normalized using single sample processing methods, with focus on comparisons between regions within a given contact map. Here, we aim to compare contact maps across different samples. We demonstrate that unwanted variation, of likely technical origin, is present in Hi-C data with replicates from different individuals, and that properties of this unwanted variation change across the contact map. We present band-wise normalization and batch correction, a method for normalization and batch correction of Hi-C data and show that it substantially improves comparisons across samples, including in a quantitative trait loci analysis as well as differential enrichment across cell types.<\/jats:p>","DOI":"10.1093\/bib\/bbae217","type":"journal-article","created":{"date-parts":[[2024,4,24]],"date-time":"2024-04-24T15:47:49Z","timestamp":1713973669000},"source":"Crossref","is-referenced-by-count":5,"title":["Removing unwanted variation between samples in Hi-C experiments"],"prefix":"10.1093","volume":"25","author":[{"given":"Kipper","family":"Fletez-Brant","sequence":"first","affiliation":[{"name":"McKusick-Nathans Institute of Genetic Medicine, Johns Hopkins School of Medicine , Baltimore, MD 21205 , USA"},{"name":"Department of Biostatistics, Johns Hopkins Bloomberg School of Public Health , Baltmore, MD 21205 , USA"}]},{"given":"Yunjiang","family":"Qiu","sequence":"additional","affiliation":[{"name":"Bioinformatics and Systems Biology Graduate Program, University of California , San Diego, La Jolla, CA 92093 , USA"},{"name":"Ludwig Institute for Cancer Research , New York, NY 10016 , USA"}]},{"given":"David U","family":"Gorkin","sequence":"additional","affiliation":[{"name":"Ludwig Institute for Cancer Research , New York, NY 10016 , USA"},{"name":"Department of Cellular and Molecular Medicine, University of California at San Diego , La Jolla, CA 92093 , USA"},{"name":"Currently: Department of Biology. Emory University. Atlanta , GA 30322 , USA"}]},{"given":"Ming","family":"Hu","sequence":"additional","affiliation":[{"name":"Department of Quantitative Health Sciences, Lerner Research Institute , Cleveland Clinic Foundation, Cleveland, OH 44196 , USA"}]},{"given":"Kasper D","family":"Hansen","sequence":"additional","affiliation":[{"name":"McKusick-Nathans Institute of Genetic Medicine, Johns Hopkins School of Medicine , Baltimore, MD 21205 , USA"},{"name":"Department of Biostatistics, Johns Hopkins Bloomberg School of Public Health , Baltmore, MD 21205 , USA"}]}],"member":"286","published-online":{"date-parts":[[2024,5,6]]},"reference":[{"key":"2024050706054502700_ref1","doi-asserted-by":"crossref","first-page":"289","DOI":"10.1126\/science.1181369","article-title":"Comprehensive mapping of long-range interactions reveals folding principles of the human genome","volume":"326","author":"Lieberman-Aiden","year":"2009","journal-title":"Science"},{"key":"2024050706054502700_ref2","doi-asserted-by":"crossref","first-page":"11","DOI":"10.1101\/gad.179804.111","article-title":"A decade of 3C technologies: insights into nuclear organization","volume":"26","author":"de Wit","year":"2012","journal-title":"Genes Dev"},{"key":"2024050706054502700_ref3","doi-asserted-by":"crossref","first-page":"390","DOI":"10.1038\/nrg3454","article-title":"Exploring the three-dimensional organization of genomes: interpreting chromatin interaction data","volume":"14","author":"Dekker","year":"2013","journal-title":"Nat Rev Genet"},{"key":"2024050706054502700_ref4","doi-asserted-by":"crossref","first-page":"743","DOI":"10.1038\/nrm.2016.104","article-title":"Genome-wide mapping and analysis of chromosome architecture","volume":"17","author":"Schmitt","year":"2016","journal-title":"Nat Rev Mol Cell Biol"},{"key":"2024050706054502700_ref5","doi-asserted-by":"crossref","first-page":"125","DOI":"10.1038\/nmeth.4146","article-title":"How best to identify chromosomal interactions: a comparison of approaches","volume":"14","author":"Davies","year":"2017","journal-title":"Nat Methods"},{"key":"2024050706054502700_ref6","doi-asserted-by":"crossref","first-page":"376","DOI":"10.1038\/nature11082","article-title":"Topological domains in mammalian genomes identified by analysis of chromatin interactions","volume":"485","author":"Dixon","year":"2012","journal-title":"Nature"},{"key":"2024050706054502700_ref7","doi-asserted-by":"crossref","first-page":"381","DOI":"10.1038\/nature11049","article-title":"Spatial partitioning of the regulatory landscape of the X-inactivation Centre","volume":"485","author":"Nora","year":"2012","journal-title":"Nature"},{"key":"2024050706054502700_ref8","doi-asserted-by":"crossref","first-page":"458","DOI":"10.1016\/j.cell.2012.01.010","article-title":"Three-dimensional folding and functional organization principles of the drosophila genome","volume":"148","author":"Sexton","year":"2012","journal-title":"Cell"},{"key":"2024050706054502700_ref9","doi-asserted-by":"crossref","first-page":"1665","DOI":"10.1016\/j.cell.2014.11.021","article-title":"A 3D map of the human genome at kilobase resolution reveals principles of chromatin looping","volume":"159","author":"Rao","year":"2014","journal-title":"Cell"},{"key":"2024050706054502700_ref10","doi-asserted-by":"crossref","first-page":"255","DOI":"10.1186\/s13059-019-1855-4","article-title":"Common DNA sequence variation influences 3-dimensional conformation of the human genome","volume":"20","author":"Gorkin","year":"2019","journal-title":"Genome Biol"},{"key":"2024050706054502700_ref11","doi-asserted-by":"crossref","first-page":"696","DOI":"10.1016\/j.tig.2015.10.004","article-title":"The hierarchy of transcriptional activation: from enhancer to promoter","volume":"31","author":"Vernimmen","year":"2015","journal-title":"Trends Genet"},{"key":"2024050706054502700_ref12","doi-asserted-by":"crossref","first-page":"999","DOI":"10.1101\/gr.160374.113","article-title":"Statistical confidence estimation for hi-C data reveals regulatory chromatin contacts","volume":"24","author":"Ay","year":"2014","journal-title":"Genome Res"},{"key":"2024050706054502700_ref13","doi-asserted-by":"crossref","first-page":"15454","DOI":"10.1038\/ncomms15454","article-title":"An integrated model for detecting significant chromatin interactions from high-resolution hi-C data","volume":"8","author":"Carty","year":"2017","journal-title":"Nat Commun"},{"key":"2024050706054502700_ref14","doi-asserted-by":"crossref","first-page":"180","DOI":"10.1186\/s13059-015-0741-y","article-title":"Reconstructing a\/B compartments as revealed by hi-C using long-range correlations in epigenetic data","volume":"16","author":"Fortin","year":"2015","journal-title":"Genome Biol"},{"key":"2024050706054502700_ref15","doi-asserted-by":"crossref","first-page":"1059","DOI":"10.1038\/ng.947","article-title":"Probabilistic modeling of hi-C contact maps eliminates systematic biases to characterize global chromosomal architecture","volume":"43","author":"Yaffe","year":"2011","journal-title":"Nat Genet"},{"key":"2024050706054502700_ref16","doi-asserted-by":"crossref","first-page":"3131","DOI":"10.1093\/bioinformatics\/bts570","article-title":"HiCNorm: removing biases in hi-C data via Poisson regression","volume":"28","author":"Hu","year":"2012","journal-title":"Bioinformatics"},{"key":"2024050706054502700_ref17","doi-asserted-by":"crossref","first-page":"e49","DOI":"10.1093\/nar\/gky064","article-title":"OneD: increasing reproducibility of hi-C samples with abnormal karyotypes","volume":"46","author":"Vidal","year":"2018","journal-title":"Nucleic Acids Res"},{"key":"2024050706054502700_ref18","doi-asserted-by":"crossref","first-page":"999","DOI":"10.1038\/nmeth.2148","article-title":"Iterative correction of hi-C data reveals hallmarks of chromosome organization","volume":"9","author":"Imakaev","year":"2012","journal-title":"Nat Methods"},{"key":"2024050706054502700_ref19","doi-asserted-by":"crossref","first-page":"1029","DOI":"10.1093\/imanum\/drs019","article-title":"A fast algorithm for matrix balancing","volume":"33","author":"Knight","year":"2013","journal-title":"IMA J Numer Anal"},{"key":"2024050706054502700_ref20","doi-asserted-by":"crossref","first-page":"2199","DOI":"10.1093\/bioinformatics\/btx152","article-title":"HiC-Spector: a matrix library for spectral and reproducibility analysis of hi-C contact maps","volume":"33","author":"Yan","year":"2017","journal-title":"Bioinformatics"},{"key":"2024050706054502700_ref21","doi-asserted-by":"crossref","first-page":"733","DOI":"10.1038\/nrg2825","article-title":"Tackling the widespread and critical impact of batch effects in high-throughput data","volume":"11","author":"Leek","year":"2010","journal-title":"Nat Rev Genet"},{"key":"2024050706054502700_ref22","doi-asserted-by":"crossref","first-page":"1724","DOI":"10.1371\/journal.pgen.0030161","article-title":"Capturing heterogeneity in gene expression studies by surrogate variable analysis","volume":"3","author":"Leek","year":"2007","journal-title":"PLoS Genet"},{"key":"2024050706054502700_ref23","doi-asserted-by":"crossref","first-page":"18718","DOI":"10.1073\/pnas.0808709105","article-title":"A general framework for multiple testing dependence","volume":"105","author":"Leek","year":"2008","journal-title":"PNAS"},{"key":"2024050706054502700_ref24","doi-asserted-by":"crossref","first-page":"539","DOI":"10.1093\/biostatistics\/kxr034","article-title":"Using control genes to correct for unwanted variation in microarray data","volume":"13","author":"Gagnon-Bartsch","year":"2012","journal-title":"Biostatistics"},{"key":"2024050706054502700_ref25","doi-asserted-by":"crossref","first-page":"118","DOI":"10.1093\/biostatistics\/kxj037","article-title":"Adjusting batch effects in microarray expression data using empirical Bayes methods","volume":"8","author":"Johnson","year":"2007","journal-title":"Biostatistics"},{"key":"2024050706054502700_ref26","doi-asserted-by":"crossref","first-page":"e1000770","DOI":"10.1371\/journal.pcbi.1000770","article-title":"A Bayesian framework to account for complex non-genetic factors in gene expression levels greatly increases power in eQTL studies","volume":"6","author":"Stegle","year":"2010","journal-title":"PLoS Comput Biol"},{"key":"2024050706054502700_ref27","doi-asserted-by":"crossref","first-page":"gku864","DOI":"10.1093\/nar\/gku864","article-title":"Svaseq: removing batch effects and other unwanted noise from sequencing data","volume":"42","author":"Leek","year":"2014","journal-title":"Nucleic Acids Res"},{"key":"2024050706054502700_ref28","doi-asserted-by":"crossref","first-page":"896","DOI":"10.1038\/nbt.2931","article-title":"Normalization of RNA-seq data using factor analysis of control genes or samples","volume":"32","author":"Risso","year":"2014","journal-title":"Nat Biotechnol"},{"key":"2024050706054502700_ref29","doi-asserted-by":"crossref","first-page":"258","DOI":"10.1186\/s12859-015-0683-0","article-title":"diffHic: a Bioconductor package to detect differential genomic interactions in hi-C data","volume":"16","author":"Lun","year":"2015","journal-title":"BMC Bioinformatics"},{"key":"2024050706054502700_ref30","doi-asserted-by":"crossref","first-page":"279","DOI":"10.1186\/s12859-018-2288-x","article-title":"HiCcompare: an R-package for joint normalization and comparison of HI-C datasets","volume":"19","author":"Stansfield","year":"2018","journal-title":"BMC Bioinformatics"},{"issue":"17","key":"2024050706054502700_ref31","doi-asserted-by":"crossref","first-page":"2916","DOI":"10.1093\/bioinformatics\/btz048","article-title":"multiHiCcompare: joint normalization and comparative analysis of complex hi-C experiments","volume":"35","author":"Stansfield","year":"2019","journal-title":"Bioinformatics"},{"key":"2024050706054502700_ref32","doi-asserted-by":"crossref","first-page":"e15","DOI":"10.1093\/nar\/30.4.e15","article-title":"Normalization for cDNA microarray data: a robust composite method addressing single and multiple slide systematic variation","volume":"30","author":"Yang","year":"2002","journal-title":"Nucleic Acids Res"},{"key":"2024050706054502700_ref33","doi-asserted-by":"crossref","first-page":"789","DOI":"10.1038\/nature02168","article-title":"The international HapMap project","volume":"426","author":"International HapMap Consortium","year":"2003","journal-title":"Nature"},{"key":"2024050706054502700_ref34","doi-asserted-by":"crossref","first-page":"57","DOI":"10.1186\/s13059-019-1658-7","article-title":"Measuring the reproducibility and quality of hi-C data","volume":"20","author":"Yardimci","year":"2019","journal-title":"Genome Biol"},{"key":"2024050706054502700_ref35","doi-asserted-by":"crossref","first-page":"1939","DOI":"10.1101\/gr.220640.117","article-title":"HiCRep: assessing the reproducibility of hi-C data using a stratum-adjusted correlation coefficient","volume":"27","author":"Yang","year":"2017","journal-title":"Genome Res"},{"key":"2024050706054502700_ref36","doi-asserted-by":"crossref","first-page":"1217","DOI":"10.1038\/ng2142","article-title":"Population genomics of human gene expression","volume":"39","author":"Stranger","year":"2007","journal-title":"Nat Genet"},{"key":"2024050706054502700_ref37","doi-asserted-by":"crossref","first-page":"768","DOI":"10.1038\/nature08872","article-title":"Understanding mechanisms underlying human gene expression variation with RNA sequencing","volume":"464","author":"Pickrell","year":"2010","journal-title":"Nature"},{"key":"2024050706054502700_ref38","doi-asserted-by":"crossref","first-page":"773","DOI":"10.1038\/nature08903","article-title":"Transcriptome genetics using second generation sequencing in a Caucasian population","volume":"464","author":"Montgomery","year":"2010","journal-title":"Nature"},{"key":"2024050706054502700_ref39","doi-asserted-by":"crossref","first-page":"390","DOI":"10.1038\/nature10808","article-title":"DNase I sensitivity QTLs are a major determinant of human expression variation","volume":"482","author":"Degner","year":"2012","journal-title":"Nature"},{"key":"2024050706054502700_ref40","doi-asserted-by":"crossref","first-page":"750","DOI":"10.1126\/science.1242510","article-title":"Extensive variation in chromatin states across humans","volume":"342","author":"Kasowski","year":"2013","journal-title":"Science"},{"key":"2024050706054502700_ref41","doi-asserted-by":"crossref","first-page":"747","DOI":"10.1126\/science.1242429","article-title":"Identification of genetic variants that affect histone modifications in human cells","volume":"342","author":"McVicker","year":"2013","journal-title":"Science"},{"key":"2024050706054502700_ref42","doi-asserted-by":"crossref","first-page":"744","DOI":"10.1126\/science.1242463","article-title":"Coordinated effects of sequence variation on DNA binding, chromatin structure, and transcription","volume":"342","author":"Kilpinen","year":"2013","journal-title":"Science"},{"key":"2024050706054502700_ref43","doi-asserted-by":"crossref","first-page":"R10","DOI":"10.1186\/gb-2011-12-1-r10","article-title":"DNA methylation patterns associate with genetic and gene expression variation in HapMap cell lines","volume":"12","author":"Bell","year":"2011","journal-title":"Genome Biol"},{"key":"2024050706054502700_ref44","doi-asserted-by":"crossref","first-page":"829","DOI":"10.1016\/j.ajhg.2010.10.018","article-title":"Population differences in the rate of proliferation of international HapMap cell lines","volume":"87","author":"Stark","year":"2010","journal-title":"Am J Hum Genet"},{"key":"2024050706054502700_ref45","doi-asserted-by":"crossref","first-page":"e1000287","DOI":"10.1371\/journal.pgen.1000287","article-title":"Genetic analysis of human traits in vitro: drug response and gene expression in lymphoblastoid cell lines","volume":"4","author":"Choy","year":"2008","journal-title":"PLoS Genet"},{"issue":"1","key":"2024050706054502700_ref46","doi-asserted-by":"crossref","first-page":"311","DOI":"10.1093\/bioinformatics\/btz540","article-title":"Cooler: scalable storage for hi-C data and other genomically labeled arrays","volume":"36","author":"Abdennur","year":"2020","journal-title":"Bioinformatics"},{"key":"2024050706054502700_ref47","doi-asserted-by":"crossref","DOI":"10.1093\/hmg\/ddx043","article-title":"Conditional eQTL analysis reveals allelic heterogeneity of gene expression","volume":"26","author":"Jansen","year":"2017","journal-title":"Hum Mol Genet"},{"key":"2024050706054502700_ref48","doi-asserted-by":"crossref","first-page":"256","DOI":"10.1186\/s13059-020-02167-0","article-title":"Mustache: multi-scale detection of chromatin loops from hi-C and micro-C maps using scale-space representation","volume":"21","author":"Ardakany","year":"2020","journal-title":"Genome Biol"},{"key":"2024050706054502700_ref49","article-title":"TADCompare: an R package for differential and temporal analysis of topologically associated domains","volume":"11","author":"Kreswell","year":"2020","journal-title":"Front Genet"},{"issue":"1","key":"2024050706054502700_ref50","doi-asserted-by":"crossref","first-page":"1054","DOI":"10.1038\/s41467-019-08940-5","article-title":"Subtle changes in chromatin loop contact propensity are associated with differential gene regulation and expression","volume":"10","author":"Greenwald","year":"2019","journal-title":"Nat Commun"},{"key":"2024050706054502700_ref51","first-page":"404962","article-title":"Overcoming systematic errors caused by log-transformation of normalized single-cell RNA sequencing data","author":"Lun","year":"2018","journal-title":"bioRxiv"},{"issue":"1","key":"2024050706054502700_ref52","doi-asserted-by":"crossref","first-page":"99","DOI":"10.1016\/j.cels.2015.07.012","article-title":"Juicebox provides a visualization system for hi-C contact maps with unlimited zoom","volume":"3","author":"Durand","year":"2016","journal-title":"Cell Systems"},{"issue":"1","key":"2024050706054502700_ref53","doi-asserted-by":"crossref","first-page":"125","DOI":"10.1186\/s13059-018-1486-1","article-title":"HiGlass: web-based visual exploration and analysis of genome interaction maps","volume":"19","author":"Kerpedjiev","year":"2018","journal-title":"Genome Biol"},{"key":"2024050706054502700_ref54","doi-asserted-by":"crossref","first-page":"262","DOI":"10.1186\/s12859-018-2263-6","article-title":"Alternative empirical Bayes models for adjusting for batch effects in genomic studies","volume":"19","author":"Zhang","year":"2019","journal-title":"BMC Bioinformatics"},{"key":"2024050706054502700_ref55","doi-asserted-by":"crossref","first-page":"7111","DOI":"10.1038\/s41467-023-42651-2","article-title":"Tracing cancer evolution and heterogeneity using hi-C","volume":"14","author":"Erdmann-Pham","year":"2023","journal-title":"Nat Commun"},{"key":"2024050706054502700_ref56","doi-asserted-by":"crossref","first-page":"693","DOI":"10.1016\/j.cell.2017.04.013","article-title":"The Cohesin release factor WAPL restricts chromatin loop extension","volume":"169","author":"Haarhuis","year":"2017","journal-title":"Cell"}],"container-title":["Briefings in Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/academic.oup.com\/bib\/article-pdf\/25\/3\/bbae217\/57420008\/bbae217.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bib\/article-pdf\/25\/3\/bbae217\/57420008\/bbae217.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,5,7]],"date-time":"2024-05-07T02:06:33Z","timestamp":1715047593000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/bib\/article\/doi\/10.1093\/bib\/bbae217\/7665587"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,3,27]]},"references-count":56,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2024,3,27]]}},"URL":"https:\/\/doi.org\/10.1093\/bib\/bbae217","relation":{"has-preprint":[{"id-type":"doi","id":"10.1101\/214361","asserted-by":"object"}]},"ISSN":["1467-5463","1477-4054"],"issn-type":[{"value":"1467-5463","type":"print"},{"value":"1477-4054","type":"electronic"}],"subject":[],"published-other":{"date-parts":[[2024,5,1]]},"published":{"date-parts":[[2024,3,27]]},"article-number":"bbae217"}}