{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,12]],"date-time":"2026-04-12T14:34:44Z","timestamp":1776004484784,"version":"3.50.1"},"reference-count":17,"publisher":"Springer Science and Business Media LLC","issue":"6","license":[{"start":{"date-parts":[[2021,6,21]],"date-time":"2021-06-21T00:00:00Z","timestamp":1624233600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2021,6,21]],"date-time":"2021-06-21T00:00:00Z","timestamp":1624233600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/100000051","name":"U.S. Department of Health & Human Services | NIH | National Human Genome Research Institute","doi-asserted-by":"publisher","award":["HG009141"],"award-info":[{"award-number":["HG009141"]}],"id":[{"id":"10.13039\/100000051","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000057","name":"U.S. Department of Health & Human Services | NIH | National Institute of General Medical Sciences","doi-asserted-by":"publisher","award":["GM124355"],"award-info":[{"award-number":["GM124355"]}],"id":[{"id":"10.13039\/100000057","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Nat Comput Sci"],"DOI":"10.1038\/s43588-021-00085-0","type":"journal-article","created":{"date-parts":[[2021,6,21]],"date-time":"2021-06-21T12:04:08Z","timestamp":1624277048000},"page":"441-447","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":6,"title":["Balancing efficient analysis and storage of quantitative genomics data with the D4 format and d4tools"],"prefix":"10.1038","volume":"1","author":[{"given":"Hao","family":"Hou","sequence":"first","affiliation":[]},{"given":"Brent","family":"Pedersen","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1756-0859","authenticated-orcid":false,"given":"Aaron","family":"Quinlan","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2021,6,21]]},"reference":[{"key":"85_CR1","doi-asserted-by":"publisher","first-page":"e46922","DOI":"10.7554\/eLife.46922","volume":"8","author":"TA Sasani","year":"2019","unstructured":"Sasani, T. A. et al. Large, three-generation human families reveal post-zygotic mosaicism and variability in germline mutation accumulation. Elife 8, e46922 (2019).","journal-title":"Elife"},{"key":"85_CR2","doi-asserted-by":"publisher","first-page":"139","DOI":"10.1093\/bioinformatics\/btp616","volume":"26","author":"MD Robinson","year":"2010","unstructured":"Robinson, M. D., McCarthy, D. J. & Smyth, G. K. edgeR: a Bioconductor package for differential expression analysis of digital gene expression data. Bioinformatics 26, 139\u2013140 (2010).","journal-title":"Bioinformatics"},{"key":"85_CR3","doi-asserted-by":"crossref","unstructured":"Anders, S. & Huber, W. Differential expression analysis for sequence count data. Genome Biol. 11, R106 (2010).","DOI":"10.1186\/gb-2010-11-10-r106"},{"key":"85_CR4","doi-asserted-by":"publisher","unstructured":"2 Chromatin patterns at transcription factor binding sites. Nature https:\/\/doi.org\/10.1038\/nature28171 (2019).","DOI":"10.1038\/nature28171"},{"key":"85_CR5","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1093\/gigascience\/gix090","volume":"6","author":"BS Pedersen","year":"2017","unstructured":"Pedersen, B. S., Collins, R. L., Talkowski, M. E. & Quinlan, A. R. Indexcov: fast coverage quality control for whole-genome sequencing. Gigascience 6, 1\u20136 (2017).","journal-title":"Gigascience"},{"key":"85_CR6","doi-asserted-by":"publisher","first-page":"2204","DOI":"10.1093\/bioinformatics\/btq351","volume":"26","author":"WJ Kent","year":"2010","unstructured":"Kent, W. J., Zweig, A. S., Barber, G., Hinrichs, A. S. & Karolchik, D. bigWig and bigBed: enabling browsing of large distributed datasets. Bioinformatics 26, 2204\u20132207 (2010).","journal-title":"Bioinformatics"},{"key":"85_CR7","unstructured":"Frequently asked questions: data file formats. Genome Browser https:\/\/genome.ucsc.edu\/FAQ\/FAQformat.html (2021)."},{"key":"85_CR8","doi-asserted-by":"publisher","unstructured":"Koranne, S. Handbook of Open Source Tools 191\u2013200 (Springer, 2011); https:\/\/doi.org\/10.1007\/978-1-4419-7719-9_10","DOI":"10.1007\/978-1-4419-7719-9_10"},{"key":"85_CR9","doi-asserted-by":"publisher","first-page":"2078","DOI":"10.1093\/bioinformatics\/btp352","volume":"25","author":"H Li","year":"2009","unstructured":"Li, H. et al. The Sequence Alignment\/Map format and SAMtools. Bioinformatics 25, 2078\u20132079 (2009).","journal-title":"Bioinformatics"},{"key":"85_CR10","doi-asserted-by":"publisher","first-page":"734","DOI":"10.1101\/gr.114819.110","volume":"21","author":"MH-Y Fritz","year":"2011","unstructured":"Fritz, M. H.-Y., Leinonen, R., Cochrane, G. & Birney, E. Efficient storage of high throughput DNA sequencing data using reference-based compression. Genome Res. 21, 734\u2013740 (2011).","journal-title":"Genome Res."},{"key":"85_CR11","doi-asserted-by":"publisher","first-page":"185","DOI":"10.1145\/182590.182453","volume":"VII","author":"Z Shao","year":"1994","unstructured":"Shao, Z., Reppy, J. H. & Appel, A. W. Unrolling lists. SIGPLAN Lisp Pointers VII, 185\u2013195 (1994).","journal-title":"SIGPLAN Lisp Pointers"},{"key":"85_CR12","doi-asserted-by":"publisher","first-page":"867","DOI":"10.1093\/bioinformatics\/btx699","volume":"34","author":"BS Pedersen","year":"2018","unstructured":"Pedersen, B. S. & Quinlan, A. R. mosdepth: quick coverage calculation for genomes and exomes. Bioinformatics 34, 867\u2013868 (2018).","journal-title":"Bioinformatics"},{"key":"85_CR13","unstructured":"The SAM\/BAM Format Specification Working Group Sequence Alignment\/Map Format Specification (GitHub, 2021); http:\/\/samtools.github.io\/hts-specs\/SAMv1.pdf"},{"key":"85_CR14","doi-asserted-by":"publisher","first-page":"btv561","DOI":"10.1093\/bioinformatics\/btv561","volume":"32","author":"Z Wang","year":"2015","unstructured":"Wang, Z., Weissman, T. & Milenkovic, O. smallWig: parallel compression of RNA-seq WIG files. Bioinformatics 32, btv561 (2015).","journal-title":"Bioinformatics"},{"key":"85_CR15","doi-asserted-by":"publisher","first-page":"2843","DOI":"10.1093\/bioinformatics\/btu356","volume":"30","author":"H Li","year":"2014","unstructured":"Li, H. Toward better understanding of artifacts in variant calling from high-coverage samples. Bioinformatics 30, 2843\u20132851 (2014).","journal-title":"Bioinformatics"},{"key":"85_CR16","doi-asserted-by":"publisher","first-page":"57","DOI":"10.1038\/nature11247","volume":"489","author":"ENCODE Project Consortium","year":"2012","unstructured":"ENCODE Project Consortium An integrated encyclopedia of DNA elements in the human genome. Nature 489, 57\u201374 (2012).","journal-title":"Nature"},{"key":"85_CR17","doi-asserted-by":"publisher","unstructured":"Hou, H., Quinlan, A. & Pedersen, B. Efficient analysis of quantitative genomics data with the D4 format. Zenodo https:\/\/doi.org\/10.5281\/ZENODO.4684595 (2021).","DOI":"10.5281\/ZENODO.4684595"}],"updated-by":[{"DOI":"10.1038\/s43588-022-00211-6","type":"correction","label":"Correction","source":"publisher","updated":{"date-parts":[[2022,2,15]],"date-time":"2022-02-15T00:00:00Z","timestamp":1644883200000}}],"container-title":["Nature Computational Science"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/www.nature.com\/articles\/s43588-021-00085-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/www.nature.com\/articles\/s43588-021-00085-0","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/www.nature.com\/articles\/s43588-021-00085-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,12,3]],"date-time":"2022-12-03T16:27:24Z","timestamp":1670084844000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.nature.com\/articles\/s43588-021-00085-0"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,6,21]]},"references-count":17,"journal-issue":{"issue":"6","published-online":{"date-parts":[[2021,6]]}},"alternative-id":["85"],"URL":"https:\/\/doi.org\/10.1038\/s43588-021-00085-0","relation":{"has-preprint":[{"id-type":"doi","id":"10.1101\/2020.10.23.352567","asserted-by":"object"}]},"ISSN":["2662-8457"],"issn-type":[{"value":"2662-8457","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021,6,21]]},"assertion":[{"value":"4 December 2020","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"14 May 2021","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"21 June 2021","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 February 2022","order":4,"name":"change_date","label":"Change Date","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"Correction","order":5,"name":"change_type","label":"Change Type","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"A Correction to this paper has been published:","order":6,"name":"change_details","label":"Change Details","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"https:\/\/doi.org\/10.1038\/s43588-022-00211-6","URL":"https:\/\/doi.org\/10.1038\/s43588-022-00211-6","order":7,"name":"change_details","label":"Change Details","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"The authors declare no competing interests.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}]}}