{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,26]],"date-time":"2026-02-26T20:34:34Z","timestamp":1772138074535,"version":"3.50.1"},"reference-count":32,"publisher":"Oxford University Press (OUP)","issue":"6","license":[{"start":{"date-parts":[[2025,5,12]],"date-time":"2025-05-12T00:00:00Z","timestamp":1747008000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"DOI":"10.13039\/501100001350","name":"Singapore Ministry of Health","doi-asserted-by":"crossref","award":["OFIRG21nov-0083"],"award-info":[{"award-number":["OFIRG21nov-0083"]}],"id":[{"id":"10.13039\/501100001350","id-type":"DOI","asserted-by":"crossref"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,6,2]]},"abstract":"<jats:title>Abstract<\/jats:title>\n                  <jats:sec>\n                    <jats:title>Motivation<\/jats:title>\n                    <jats:p>Cell-free DNA (cfDNA) analysis has wide-ranging clinical applications due to its noninvasive nature. However, cfDNA fragmentomics and copy number analysis can be complicated by GC bias. There is a lack of GC correction software based on rigorous cfDNA GC bias analysis. Furthermore, there is no standardized metric for comparing GC bias correction methods across large sample sets, nor a rigorous experiment setup to demonstrate their effectiveness on cfDNA data at various coverage levels.<\/jats:p>\n                  <\/jats:sec>\n                  <jats:sec>\n                    <jats:title>Results<\/jats:title>\n                    <jats:p>We present GCfix, a method for robust GC bias correction in cfDNA data across diverse coverages. Developed following an in-depth analysis of cfDNA GC bias at the region and fragment length levels, GCfix is both fast and accurate. 
It works on all reference genomes and generates correction factors, tagged BAM files, and corrected coverage tracks. We also introduce two orthogonal performance metrics for (i) comparing the fragment count density distribution of GC content between expected and corrected samples, and (ii) evaluating coverage profile improvement post-correction. GCfix outperforms existing cfDNA GC bias correction methods on these metrics.<\/jats:p>\n                  <\/jats:sec>\n                  <jats:sec>\n                    <jats:title>Availability and implementation<\/jats:title>\n                    <jats:p>GCfix software and code for reproducing the figures are publicly accessible on GitHub: https:\/\/github.com\/Rafeed-bot\/GCfix_Software.<\/jats:p>\n                  <\/jats:sec>","DOI":"10.1093\/bioinformatics\/btaf293","type":"journal-article","created":{"date-parts":[[2025,5,9]],"date-time":"2025-05-09T08:10:26Z","timestamp":1746778226000},"source":"Crossref","is-referenced-by-count":1,"title":["GCfix: a fast and accurate fragment length-specific method for correcting GC bias in cell-free DNA"],"prefix":"10.1093","volume":"41","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-5481-8025","authenticated-orcid":false,"given":"Chowdhury Rafeed","family":"Rahman","sequence":"first","affiliation":[{"name":"Genome Institute of Singapore (GIS), Agency for Science, Technology and Research (A*STAR) , 138672,","place":["Singapore"]},{"name":"School of Computing, National University of Singapore , 117417,","place":["Singapore"]}]},{"given":"Zhong Wee","family":"Poh","sequence":"additional","affiliation":[{"name":"Genome Institute of Singapore (GIS), Agency for Science, Technology and Research (A*STAR) , 138672,","place":["Singapore"]},{"name":"School of Computing, National University of Singapore , 117417,","place":["Singapore"]}]},{"given":"Anders Jacobsen","family":"Skanderup","sequence":"additional","affiliation":[{"name":"Genome Institute of Singapore (GIS), Agency for 
Science, Technology and Research (A*STAR) , 138672,","place":["Singapore"]}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1241-5441","authenticated-orcid":false,"given":"Limsoon","family":"Wong","sequence":"additional","affiliation":[{"name":"School of Computing, National University of Singapore , 117417,","place":["Singapore"]}]}],"member":"286","published-online":{"date-parts":[[2025,5,12]]},"reference":[{"key":"2025070408321955900_btaf293-B1","doi-asserted-by":"crossref","first-page":"1324","DOI":"10.1038\/s41467-017-00965-y","article-title":"Scalable whole-exome sequencing of cell-free DNA reveals high concordance with metastatic tumors","volume":"8","author":"Adalsteinsson","year":"2017","journal-title":"Nat Commun"},{"key":"2025070408321955900_btaf293-B2","doi-asserted-by":"crossref","first-page":"R18","DOI":"10.1186\/gb-2011-12-2-r18","article-title":"Analyzing and minimizing PCR amplification bias in illumina sequencing libraries","volume":"12","author":"Aird","year":"2011","journal-title":"Genome Biol"},{"key":"2025070408321955900_btaf293-B3","doi-asserted-by":"crossref","first-page":"e72","DOI":"10.1093\/nar\/gks001","article-title":"Summarizing and correcting the GC content bias in high-throughput sequencing","volume":"40","author":"Benjamini","year":"2012","journal-title":"Nucleic Acids Res"},{"key":"2025070408321955900_btaf293-B4","doi-asserted-by":"crossref","first-page":"268","DOI":"10.1093\/bioinformatics\/btq635","article-title":"Control-free calling of copy number alterations in deep-sequencing data using GC-content normalization","volume":"27","author":"Boeva","year":"2011","journal-title":"Bioinformatics"},{"key":"2025070408321955900_btaf293-B5","doi-asserted-by":"crossref","first-page":"giaa008","DOI":"10.1093\/gigascience\/giaa008","article-title":"GC bias affects genomic and metagenomic reconstructions, underrepresenting GC-poor 
organisms","volume":"9","author":"Browne","year":"2020","journal-title":"Gigascience"},{"key":"2025070408321955900_btaf293-B6","doi-asserted-by":"crossref","first-page":"2254","DOI":"10.1158\/1078-0432.CCR-18-1593","article-title":"Low-pass whole-genome sequencing of circulating cell-free DNA demonstrates dynamic changes in genomic copy number in a squamous lung cancer clinical cohort","volume":"25","author":"Chen","year":"2019","journal-title":"Clin Cancer Res"},{"key":"2025070408321955900_btaf293-B7","doi-asserted-by":"crossref","first-page":"385","DOI":"10.1038\/s41586-019-1272-6","article-title":"Genome-wide cell-free DNA fragmentation in patients with cancer","volume":"570","author":"Cristiano","year":"2019","journal-title":"Nature"},{"key":"2025070408321955900_btaf293-B8","doi-asserted-by":"crossref","first-page":"7475","DOI":"10.1038\/s41467-022-35076-w","article-title":"A framework for clinical cancer subtyping from nucleosome profiling of cell-free DNA","volume":"13","author":"Doebley","year":"2022","journal-title":"Nat Commun"},{"key":"2025070408321955900_btaf293-B9","doi-asserted-by":"crossref","first-page":"e105","DOI":"10.1093\/nar\/gkn425","article-title":"Substantial biases in ultra-short read data sets from high-throughput DNA sequencing","volume":"36","author":"Dohm","year":"2008","journal-title":"Nucleic Acids Res"},{"key":"2025070408321955900_btaf293-B10","doi-asserted-by":"crossref","first-page":"1858","DOI":"10.1109\/TIT.2003.813506","article-title":"A new metric for probability distributions","volume":"49","author":"Endres","year":"2003","journal-title":"IEEE Trans Inform Theory"},{"key":"2025070408321955900_btaf293-B11","doi-asserted-by":"crossref","first-page":"29","DOI":"10.1148\/radiology.143.1.7063747","article-title":"The meaning and use of the area under a receiver operating characteristic (ROC) 
curve","volume":"143","author":"Hanley","year":"1982","journal-title":"Radiology"},{"key":"2025070408321955900_btaf293-B12","doi-asserted-by":"crossref","first-page":"e131","DOI":"10.1093\/nar\/gkq224","article-title":"Biases in illumina transcriptome sequencing caused by random hexamer priming","volume":"38","author":"Hansen","year":"2010","journal-title":"Nucleic Acids Res"},{"key":"2025070408321955900_btaf293-B13","doi-asserted-by":"crossref","first-page":"71","DOI":"10.1038\/s41576-018-0071-5","article-title":"Current and future perspectives of liquid biopsies in genomics-driven oncology","volume":"20","author":"Heitzer","year":"2019","journal-title":"Nat Rev Genet"},{"key":"2025070408321955900_btaf293-B14","doi-asserted-by":"crossref","first-page":"89848","DOI":"10.18632\/oncotarget.21163","article-title":"Rapid, ultra low coverage copy number profiling of cell-free DNA as a precision oncology screening strategy","volume":"8","author":"Hovelson","year":"2017","journal-title":"Oncotarget"},{"key":"2025070408321955900_btaf293-B15","doi-asserted-by":"crossref","first-page":"297","DOI":"10.1038\/s41571-020-00457-x","article-title":"Liquid biopsy enters the clinic: implementation issues and future challenges","volume":"18","author":"Ignatiadis","year":"2021","journal-title":"Nat Rev Clin Oncol"},{"key":"2025070408321955900_btaf293-B16","doi-asserted-by":"crossref","first-page":"360","DOI":"10.1016\/j.tig.2016.03.009","article-title":"The long and short of circulating cell-free DNA and the ins and outs of molecular diagnostics","volume":"32","author":"Jiang","year":"2016","journal-title":"Trends Genet"},{"key":"2025070408321955900_btaf293-B17","doi-asserted-by":"crossref","first-page":"291","DOI":"10.1038\/nmeth.1311","article-title":"Amplification-free illumina sequencing-library preparation facilitates improved mapping and assembly of (G+C)-biased genomes","volume":"6","author":"Kozarewa","year":"2009","journal-title":"Nat 
Methods"},{"key":"2025070408321955900_btaf293-B18","doi-asserted-by":"crossref","first-page":"eaaw3616","DOI":"10.1126\/science.aaw3616","article-title":"Epigenetics, fragmentomics, and topology of cell-free DNA in liquid biopsies","volume":"372","author":"Lo","year":"2021","journal-title":"Science"},{"key":"2025070408321955900_btaf293-B19","doi-asserted-by":"crossref","first-page":"e23418","DOI":"10.1371\/journal.pone.0023418","article-title":"High fragmentation characterizes tumour-derived circulating DNA","volume":"6","author":"Mouliere","year":"2011","journal-title":"PLoS One"},{"key":"2025070408321955900_btaf293-B20","doi-asserted-by":"crossref","first-page":"eaat4921","DOI":"10.1126\/scitranslmed.aat4921","article-title":"Enhanced detection of circulating tumor DNA by fragment size analysis","volume":"10","author":"Mouliere","year":"2018","journal-title":"Sci Transl Med"},{"key":"2025070408321955900_btaf293-B21","doi-asserted-by":"crossref","first-page":"e90","DOI":"10.1093\/nar\/gkr344","article-title":"Sequence-specific error profile of illumina sequencers","volume":"39","author":"Nakamura","year":"2011","journal-title":"Nucleic Acids Res"},{"key":"2025070408321955900_btaf293-B22","doi-asserted-by":"publisher","author":"Poh","year":"2025","DOI":"10.1101\/2025.04.17.649313"},{"key":"2025070408321955900_btaf293-B23","doi-asserted-by":"crossref","first-page":"1005","DOI":"10.1038\/nmeth.1270","article-title":"A large genome center\u2019s improvements to the illumina sequencing system","volume":"5","author":"Quail","year":"2008","journal-title":"Nat Methods"},{"key":"2025070408321955900_btaf293-B24","doi-asserted-by":"crossref","first-page":"257","DOI":"10.1109\/5.18626","article-title":"A tutorial on hidden Markov models and selected applications in speech recognition","volume":"77","author":"Rabiner","year":"1989","journal-title":"Proc 
IEEE"},{"key":"2025070408321955900_btaf293-B25","doi-asserted-by":"crossref","first-page":"1605","DOI":"10.1093\/nar\/gky1263","article-title":"WisecondorX: improved copy number detection for routine shallow whole-genome sequencing","volume":"47","author":"Raman","year":"2019","journal-title":"Nucleic Acids Res"},{"key":"2025070408321955900_btaf293-B26","doi-asserted-by":"crossref","first-page":"357","DOI":"10.1186\/s12864-021-07686-z","article-title":"Evaluation of tools for identifying large copy number variations from ultra-low-coverage whole-genome sequencing data","volume":"22","author":"Smolander","year":"2021","journal-title":"BMC Genom"},{"key":"2025070408321955900_btaf293-B27","doi-asserted-by":"crossref","first-page":"lqad102","DOI":"10.1093\/nargab\/lqad102","article-title":"GCparagon: evaluating and correcting GC biases in cell-free DNA at the fragment level","volume":"5","author":"Spiegl","year":"2023","journal-title":"NAR Genom Bioinform"},{"key":"2025070408321955900_btaf293-B28","doi-asserted-by":"crossref","first-page":"1586","DOI":"10.1101\/gr.092981.109","article-title":"Sensitive and accurate detection of copy number variants using read depth of coverage","volume":"19","author":"Yoon","year":"2009","journal-title":"Genome Res"},{"key":"2025070408321955900_btaf293-B29","doi-asserted-by":"crossref","first-page":"32","DOI":"10.1002\/1097-0142(1950)3:1<32::AID-CNCR2820030106>3.0.CO;2-3","article-title":"Index for rating diagnostic tests","volume":"3","author":"Youden","year":"1950","journal-title":"Cancer"},{"key":"2025070408321955900_btaf293-B30","doi-asserted-by":"crossref","first-page":"e674","DOI":"10.1002\/mgg3.674","article-title":"Noninvasive prenatal testing for fetal subchromosomal copy number variations and chromosomal aneuploidy by low-pass whole-genome sequencing","volume":"7","author":"Yu","year":"2019","journal-title":"Mol Genet Genomic 
Med"},{"key":"2025070408321955900_btaf293-B31","doi-asserted-by":"crossref","first-page":"2229","DOI":"10.1038\/s41467-021-22463-y","article-title":"Tissue-specific cell-free DNA degradation quantifies circulating tumor DNA burden","volume":"12","author":"Zhu","year":"2021","journal-title":"Nat Commun"},{"key":"2025070408321955900_btaf293-B32","first-page":"1","article-title":"A deep-learning model for quantifying circulating tumour DNA from the density distribution of DNA-fragment lengths","author":"Zhu","year":"2025","journal-title":"Nat Biomed Eng"}],"container-title":["Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/academic.oup.com\/bioinformatics\/advance-article-pdf\/doi\/10.1093\/bioinformatics\/btaf293\/63155388\/btaf293.pdf","content-type":"application\/pdf","content-version":"am","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/41\/6\/btaf293\/63155388\/btaf293.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/41\/6\/btaf293\/63155388\/btaf293.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,7,4]],"date-time":"2025-07-04T08:32:31Z","timestamp":1751617951000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article\/doi\/10.1093\/bioinformatics\/btaf293\/8128862"}},"subtitle":[],"editor":[{"given":"Can","family":"Alkan","sequence":"additional","affiliation":[]}],"short-title":[],"issued":{"date-parts":[[2025,5,12]]},"references-count":32,"journal-issue":{"issue":"6","published-print":{"date-parts":[[2025,6,2]]}},"URL":"https:\/\/doi.org\/10.1093\/bioinformatics\/btaf293","relation":{"has-preprint":[{"id-type":"doi","id":"10.1101\/2024.11.07.622399","asserted-by":"object"}]},"ISSN":["1367-4811"],"issn-type":[{"value":"1367-4811","type":"e
lectronic"}],"subject":[],"published-other":{"date-parts":[[2025,6]]},"published":{"date-parts":[[2025,5,12]]},"article-number":"btaf293"}}