{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,6]],"date-time":"2026-03-06T18:10:20Z","timestamp":1772820620069,"version":"3.50.1"},"reference-count":70,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2026,1,27]],"date-time":"2026-01-27T00:00:00Z","timestamp":1769472000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2026,3,6]],"date-time":"2026-03-06T00:00:00Z","timestamp":1772755200000},"content-version":"vor","delay-in-days":38,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"funder":[{"name":"NIH","award":["R01 AI163742"],"award-info":[{"award-number":["R01 AI163742"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["BMC Bioinformatics"],"DOI":"10.1186\/s12859-025-06298-8","type":"journal-article","created":{"date-parts":[[2026,1,27]],"date-time":"2026-01-27T08:34:56Z","timestamp":1769502896000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Integration of bulk RNA-seq pipeline metrics for assessing low-quality samples"],"prefix":"10.1186","volume":"27","author":[{"given":"Samuel","family":"Hamilton","sequence":"first","affiliation":[]},{"given":"Gaurav","family":"Gadhvi","sequence":"additional","affiliation":[]},{"given":"Tyler","family":"Therron","sequence":"additional","affiliation":[]},{"given":"Deborah R.","family":"Winter","sequence":"additional","affiliation":[]},{"name":"SCRIPT Investigators","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2026,1,27]]},"reference":[{"issue":"18","key":"6298_CR1","doi-asserted-by":"publisher","first-page":"2598","DOI":"10.1093\/bioinformatics\/btr441","volume":"27","author":"Y Wang","year":"2011","unstructured":"Wang Y, Mehta G, Mayani R, Lu J, Souaiaia T, Chen Y, et al. RseqFlow: workflows for RNA-Seq data analysis. Bioinformatics. 2011;27(18):2598\u2013600.","journal-title":"Bioinformatics"},{"issue":"12","key":"6298_CR2","doi-asserted-by":"publisher","first-page":"480","DOI":"10.1186\/1471-2105-12-480","volume":"17","author":"D Risso","year":"2011","unstructured":"Risso D, Schwartz K, Sherlock G, Dudoit S. GC-content normalization for RNA-Seq data. BMC Bioinformatics. 2011;17(12):480.","journal-title":"BMC Bioinformatics"},{"issue":"9","key":"6298_CR3","doi-asserted-by":"publisher","first-page":"1543","DOI":"10.1101\/gr.121095.111","volume":"21","author":"L Jiang","year":"2011","unstructured":"Jiang L, Schlesinger F, Davis CA, Zhang Y, Li R, Salit M, et al. Synthetic spike-in standards for RNA-seq experiments. Genome Res. 2011;21(9):1543\u201351.","journal-title":"Genome Res"},{"issue":"18","key":"6298_CR4","doi-asserted-by":"publisher","first-page":"3683","DOI":"10.1093\/bioinformatics\/bti605","volume":"21","author":"CL Wilson","year":"2005","unstructured":"Wilson CL, Miller CJ. Simpleaffy: a BioConductor package for affymetrix quality control and data analysis. Bioinformatics. 2005;21(18):3683\u20135.","journal-title":"Bioinformatics"},{"issue":"7","key":"6298_CR5","doi-asserted-by":"publisher","first-page":"276","DOI":"10.1186\/1471-2105-7-276","volume":"2","author":"MJ Okoniewski","year":"2006","unstructured":"Okoniewski MJ, Miller CJ. Hybridization interactions between probesets in short oligo microarrays lead to spurious correlations. BMC Bioinform. 2006;2(7):276.","journal-title":"BMC Bioinform"},{"issue":"3","key":"6298_CR6","doi-asserted-by":"publisher","first-page":"138","DOI":"10.1016\/j.ygeno.2010.01.003","volume":"95","author":"A Kauffmann","year":"2010","unstructured":"Kauffmann A, Huber W. Microarray data quality control improves the detection of differentially expressed genes. Genomics. 2010;95(3):138\u201342.","journal-title":"Genomics"},{"issue":"1","key":"6298_CR7","doi-asserted-by":"publisher","first-page":"57","DOI":"10.1038\/nrg2484","volume":"10","author":"Z Wang","year":"2009","unstructured":"Wang Z, Gerstein M, Snyder M. RNA-Seq: a revolutionary tool for transcriptomics. Nat Rev Genet. 2009;10(1):57\u201363.","journal-title":"Nat Rev Genet"},{"issue":"12","key":"6298_CR8","doi-asserted-by":"publisher","first-page":"42","DOI":"10.1186\/1741-7007-12-42","volume":"30","author":"I Gallego Romero","year":"2014","unstructured":"Gallego Romero I, Pai AA, Tung J, Gilad Y. RNA-seq: impact of RNA degradation on transcript quantification. BMC Biol. 2014;30(12):42.","journal-title":"BMC Biol"},{"issue":"1","key":"6298_CR9","doi-asserted-by":"publisher","first-page":"56","DOI":"10.1038\/nrg3655","volume":"15","author":"K Robasky","year":"2014","unstructured":"Robasky K, Lewis NE, Church GM. The role of replicates for error mitigation in next-generation sequencing. Nat Rev Genet. 2014;15(1):56\u201362.","journal-title":"Nat Rev Genet"},{"issue":"9","key":"6298_CR10","doi-asserted-by":"publisher","first-page":"879","DOI":"10.1038\/nmeth.3091","volume":"11","author":"P Blainey","year":"2014","unstructured":"Blainey P, Krzywinski M, Altman N. Replication. Nat Methods. 2014;11(9):879\u201380.","journal-title":"Nat Methods"},{"issue":"9","key":"6298_CR11","doi-asserted-by":"publisher","first-page":"879","DOI":"10.1038\/nmeth.3091","volume":"11","author":"P Blainey","year":"2014","unstructured":"Blainey P, Krzywinski M, Altman N. Points of significance: replication. Nat Methods. 2014;11(9):879\u201380.","journal-title":"Nat Methods"},{"issue":"2","key":"6298_CR12","doi-asserted-by":"publisher","first-page":"405","DOI":"10.1534\/genetics.110.114983","volume":"185","author":"PL Auer","year":"2010","unstructured":"Auer PL, Doerge RW. Statistical design and analysis of RNA sequencing data. Genetics. 2010;185(2):405\u201316.","journal-title":"Genetics"},{"issue":"3","key":"6298_CR13","doi-asserted-by":"publisher","first-page":"40","DOI":"10.4103\/2153-3539.103013","volume":"31","author":"RR Gullapalli","year":"2012","unstructured":"Gullapalli RR, Desai KV, Santana-Santos L, Kant JA, Becich MJ. Next generation sequencing in clinical medicine: challenges and lessons for pathology and biomedical informatics. J Pathol Inform. 2012;31(3):40.","journal-title":"J Pathol Inform"},{"issue":"3","key":"6298_CR14","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pmed.1001779","volume":"12","author":"C Sudlow","year":"2015","unstructured":"Sudlow C, Gallacher J, Allen N, Beral V, Burton P, Danesh J, et al. UK biobank: an open access resource for identifying the causes of a wide range of complex diseases of middle and old age. PLoS Med. 2015;12(3):e1001779.","journal-title":"PLoS Med"},{"issue":"2","key":"6298_CR15","doi-asserted-by":"publisher","first-page":"283","DOI":"10.1016\/j.cell.2018.03.042","volume":"173","author":"C Hutter","year":"2018","unstructured":"Hutter C, Zenklusen JC. The cancer genome atlas: creating lasting value beyond its data. Cell. 2018;173(2):283\u20135.","journal-title":"Cell"},{"issue":"11","key":"6298_CR16","doi-asserted-by":"publisher","first-page":"1046","DOI":"10.1038\/nmeth.2238","volume":"9","author":"N de Souza","year":"2012","unstructured":"de Souza N. The ENCODE project. Nat Methods. 2012;9(11):1046.","journal-title":"Nat Methods"},{"issue":"12","key":"6298_CR17","doi-asserted-by":"publisher","first-page":"1375","DOI":"10.3390\/medicina57121375","volume":"57","author":"K Masago","year":"2021","unstructured":"Masago K, Fujita S, Oya Y, Takahashi Y, Matsushita H, Sasaki E, et al. Comparison between Fluorimetry (Qubit) and Spectrophotometry (NanoDrop) in the quantification of DNA and RNA extracted from Frozen and FFPE tissues from lung cancer patients: a real-world use of genomic tests. Medicina. 2021;57(12):1375.","journal-title":"Medicina"},{"key":"6298_CR18","first-page":"1","volume":"1","author":"O Mueller","year":"2004","unstructured":"Mueller O, Lightfoot S, Schroeder A. RNA integrity number (RIN)\u2013standardization of RNA quality control. Agilent Appl Note Publ. 2004;1:1\u20138.","journal-title":"Agilent Appl Note Publ"},{"issue":"7","key":"6298_CR19","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1186\/1471-2199-7-3","volume":"31","author":"A Schroeder","year":"2006","unstructured":"Schroeder A, Mueller O, Stocker S, Salowsky R, Leiber M, Gassmann M, et al. The RIN: an RNA integrity number for assigning integrity values to RNA measurements. BMC Mol Biol. 2006;31(7):3.","journal-title":"BMC Mol Biol"},{"issue":"1","key":"6298_CR20","doi-asserted-by":"publisher","first-page":"106","DOI":"10.1038\/ng0104-106a","volume":"36","author":"H Auer","year":"2004","unstructured":"Auer H, Lyianarachchi S, Newsom D, Klisovic MI, Marcucci G, Kornacker K. Erratum: chipping away at the chip bias: RNA degradation in microarray analysis. Nat Genet. 2004;36(1):106\u2013106.","journal-title":"Nat Genet"},{"issue":"6","key":"6298_CR21","doi-asserted-by":"publisher","DOI":"10.1093\/nar\/gni054","volume":"33","author":"S Imbeaud","year":"2005","unstructured":"Imbeaud S, Graudens E, Boulanger V, Barlet X, Zaborski P, Eveno E, et al. Towards standardization of RNA quality assessment using user-independent classifiers of microcapillary electrophoresis traces. Nucleic Acids Res. 2005;33(6):e56.","journal-title":"Nucleic Acids Res"},{"issue":"6","key":"6298_CR22","doi-asserted-by":"publisher","first-page":"1767","DOI":"10.1093\/nar\/gkp1137","volume":"38","author":"PJA Cock","year":"2010","unstructured":"Cock PJA, Fields CJ, Goto N, Heuer ML, Rice PM. The sanger FASTQ file format for sequences with quality scores, and the solexa\/illumina FASTQ variants. Nucl Acids Res. 2010;38(6):1767\u201371.","journal-title":"Nucl Acids Res"},{"key":"6298_CR23","unstructured":"Andrews S, Others. FastQC: a quality control tool for high throughput sequence data. Babraham Bioinformatics, Babraham Institute, Cambridge, United Kingdom; 2010."},{"issue":"14","key":"6298_CR24","doi-asserted-by":"publisher","first-page":"33","DOI":"10.1186\/1471-2105-14-33","volume":"31","author":"X Yang","year":"2013","unstructured":"Yang X, Liu D, Liu F, Wu J, Zou J, Xiao X, et al. HTQC: a fast quality control toolkit for Illumina sequencing data. BMC Bioinform. 2013;31(14):33.","journal-title":"BMC Bioinform"},{"issue":"15","key":"6298_CR25","doi-asserted-by":"publisher","first-page":"2114","DOI":"10.1093\/bioinformatics\/btu170","volume":"30","author":"AM Bolger","year":"2014","unstructured":"Bolger AM, Lohse M, Usadel B. Trimmomatic: a flexible trimmer for Illumina sequence data. Bioinformatics. 2014;30(15):2114\u201320.","journal-title":"Bioinformatics"},{"issue":"10","key":"6298_CR26","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0185056","volume":"12","author":"B Bushnell","year":"2017","unstructured":"Bushnell B, Rood J, Singer E. BBMerge\u2014accurate paired shotgun read merging via overlap. PLoS ONE. 2017;12(10):e0185056.","journal-title":"PLoS ONE"},{"issue":"1","key":"6298_CR27","doi-asserted-by":"publisher","first-page":"10","DOI":"10.14806\/ej.17.1.200","volume":"17","author":"M Martin","year":"2011","unstructured":"Martin M. Cutadapt removes adapter sequences from high-throughput sequencing reads. EMBnet J. 2011;17(1):10.","journal-title":"EMBnet J"},{"issue":"12","key":"6298_CR28","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0085024","volume":"8","author":"C Del Fabbro","year":"2013","unstructured":"Del Fabbro C, Scalabrin S, Morgante M, Giorgi FM. An extensive evaluation of read trimming effects on Illumina NGS data analysis. PLoS ONE. 2013;8(12):e85024.","journal-title":"PLoS ONE"},{"issue":"9","key":"6298_CR29","doi-asserted-by":"publisher","first-page":"1105","DOI":"10.1093\/bioinformatics\/btp120","volume":"25","author":"C Trapnell","year":"2009","unstructured":"Trapnell C, Pachter L, Salzberg SL. TopHat: discovering splice junctions with RNA-Seq. Bioinformatics. 2009;25(9):1105\u201311.","journal-title":"Bioinformatics"},{"issue":"1","key":"6298_CR30","doi-asserted-by":"publisher","first-page":"15","DOI":"10.1093\/bioinformatics\/bts635","volume":"29","author":"A Dobin","year":"2013","unstructured":"Dobin A, Davis CA, Schlesinger F, Drenkow J, Zaleski C, Jha S, et al. STAR: ultrafast universal RNA-seq aligner. Bioinformatics. 2013;29(1):15\u201321.","journal-title":"Bioinformatics"},{"issue":"2","key":"6298_CR31","doi-asserted-by":"publisher","first-page":"166","DOI":"10.1093\/bioinformatics\/btu638","volume":"31","author":"S Anders","year":"2015","unstructured":"Anders S, Pyl PT, Huber W. HTSeq\u2013a Python framework to work with high-throughput sequencing data. Bioinformatics. 2015;31(2):166\u20139.","journal-title":"Bioinformatics"},{"issue":"7","key":"6298_CR32","doi-asserted-by":"publisher","first-page":"923","DOI":"10.1093\/bioinformatics\/btt656","volume":"30","author":"Y Liao","year":"2014","unstructured":"Liao Y, Smyth GK, Shi W. featureCounts: an efficient general purpose program for assigning sequence reads to genomic features. Bioinformatics. 2014;30(7):923\u201330.","journal-title":"Bioinformatics"},{"issue":"16","key":"6298_CR33","doi-asserted-by":"publisher","first-page":"2184","DOI":"10.1093\/bioinformatics\/bts356","volume":"15;28","author":"L Wang","year":"2012","unstructured":"Wang L, Wang S, Li W. RSeQC: quality control of RNA-seq experiments. Bioinformatics. 2012;15;28(16):2184\u20135.","journal-title":"Bioinformatics"},{"issue":"1","key":"6298_CR34","doi-asserted-by":"publisher","first-page":"366","DOI":"10.1186\/s12859-014-0366-2","volume":"15","author":"C-C Lo","year":"2014","unstructured":"Lo C-C, Chain PSG. Rapid evaluation and quality control of next generation sequencing data with FaQCs. BMC Bioinform. 2014;15(1):366.","journal-title":"BMC Bioinform"},{"key":"6298_CR35","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/btz854","author":"C Prieto","year":"2019","unstructured":"Prieto C, Barrios D. Rana-seq: interactive rna-seq analysis from fastq files to functional analysis. Bioinformatics. 2019. https:\/\/doi.org\/10.1093\/bioinformatics\/btz854.","journal-title":"Bioinformatics"},{"issue":"Suppl 3","key":"6298_CR36","first-page":"7","volume":"13","author":"KW Kroll","year":"2014","unstructured":"Kroll KW, Mokaram NE, Pelletier AR, Frankhouser DE, Westphal MS, Stump PA, et al. Quality Control for RNA-Seq (QuaCRS): an integrated quality control pipeline. Cancer Inform. 2014;13(Suppl 3):7\u201314.","journal-title":"Cancer Inform"},{"issue":"19","key":"6298_CR37","doi-asserted-by":"publisher","first-page":"3047","DOI":"10.1093\/bioinformatics\/btw354","volume":"32","author":"P Ewels","year":"2016","unstructured":"Ewels P, Magnusson M, Lundin S, K\u00e4ller M. MultiQC: summarize analysis results for multiple tools and samples in a single report. Bioinformatics. 2016;32(19):3047\u20138.","journal-title":"Bioinformatics"},{"issue":"9","key":"6298_CR38","doi-asserted-by":"publisher","first-page":"888","DOI":"10.1038\/nbt.3000","volume":"32","author":"S Li","year":"2014","unstructured":"Li S, \u0141abaj PP, Zumbo P, Sykacek P, Shi W, Shi L, et al. Detecting and correcting systematic variation in large-scale RNA sequencing data. Nat Biotechnol. 2014;32(9):888\u201395.","journal-title":"Nat Biotechnol"},{"issue":"17","key":"6298_CR39","doi-asserted-by":"publisher","first-page":"58","DOI":"10.1186\/s12859-016-0922-z","volume":"3","author":"L Wang","year":"2016","unstructured":"Wang L, Nie J, Sicotte H, Li Y, Eckel-Passow JE, Dasari S, et al. Measure transcript integrity using RNA-seq data. BMC Bioinform. 2016;3(17):58.","journal-title":"BMC Bioinform"},{"key":"6298_CR40","unstructured":"Hamilton S, Gadhvi G, Winter DR. QC-DR [Internet]. GitHub. 2025. Accessed 19 June 2025. Available from: https:\/\/github.com\/DRWinterisCoding\/QCDR"},{"issue":"7847","key":"6298_CR41","doi-asserted-by":"publisher","first-page":"635","DOI":"10.1038\/s41586-020-03148-w","volume":"590","author":"RA Grant","year":"2021","unstructured":"Grant RA, Morales-Nebreda L, Markov NS, Swaminathan S, Querrey M, Guzman ER, et al. Circuits between infected macrophages and T cells in SARS-CoV-2 pneumonia. Nature. 2021;590(7847):635\u201341.","journal-title":"Nature"},{"key":"6298_CR42","first-page":"307","volume-title":"Zhang C","author":"Y Qi","year":"2012","unstructured":"Qi Y. Random Forest for Bioinformatics. In: Ma Y, editor. Zhang C. Methods and Applications. New York Springer: Ensemble Machine Learning; 2012. p. 307\u201323."},{"issue":"1","key":"6298_CR43","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1023\/A:1010933404324","volume":"45","author":"L Breiman","year":"2001","unstructured":"Breiman L. Random Forests. Mach Learn. 2001;45(1):5\u201332.","journal-title":"Mach Learn"},{"issue":"1","key":"6298_CR44","doi-asserted-by":"publisher","first-page":"19","DOI":"10.1186\/s12879-023-08931-4","volume":"24","author":"L Cai","year":"2024","unstructured":"Cai L, Zuo X, Ma L, Zhang Y, Xu F, Lu B. Associations of MMP9 polymorphism with the risk of severe pneumonia in a Southern Chinese children population. BMC Infect Dis. 2024;24(1):19.","journal-title":"BMC Infect Dis"},{"issue":"4","key":"6298_CR45","doi-asserted-by":"publisher","first-page":"L445","DOI":"10.1152\/ajplung.00217.2022","volume":"324","author":"C Sul","year":"2023","unstructured":"Sul C, Lewis C, Dee N, Burns N, Oshima K, Schmidt E, et al. Release of extracellular superoxide dismutase into alveolar fluid protects against acute lung injury and inflammation in Staphylococcus aureus pneumonia. Am J Physiol Lung Cell Mol Physiol. 2023;324(4):L445\u201355.","journal-title":"Am J Physiol Lung Cell Mol Physiol"},{"issue":"17","key":"6298_CR46","doi-asserted-by":"publisher","first-page":"9366","DOI":"10.3390\/ijms22179366","volume":"22","author":"A Lubkowska","year":"2021","unstructured":"Lubkowska A, Pluta W, Stro\u0144ska A, Lalko A. Role of heat shock proteins (HSP70 and HSP90) in viral infection. Int J Mol Sci. 2021;22(17):9366.","journal-title":"Int J Mol Sci"},{"issue":"68","key":"6298_CR47","doi-asserted-by":"publisher","first-page":"eabf2846","DOI":"10.1126\/sciimmunol.abf2846","volume":"7","author":"DP Simmons","year":"2022","unstructured":"Simmons DP, Nguyen HN, Gomez-Rivas E, Jeong Y, Jonsson AH, Chen AF, et al. SLAMF7 engagement superactivates macrophages in acute and chronic inflammation. Sci Immunol. 2022;7(68):eabf2846.","journal-title":"Sci Immunol."},{"issue":"12","key":"6298_CR48","doi-asserted-by":"publisher","first-page":"1517","DOI":"10.1164\/rccm.201712-2410OC","volume":"199","author":"PA Reyfman","year":"2019","unstructured":"Reyfman PA, Walter JM, Joshi N, Anekalla KR, McQuattie-Pimentel AC, Chiu S, et al. Single-cell transcriptomic analysis of human lung provides insights into the pathobiology of pulmonary fibrosis. Am J Respir Crit Care Med. 2019;199(12):1517\u201336.","journal-title":"Am J Respir Crit Care Med"},{"issue":"1","key":"6298_CR49","doi-asserted-by":"publisher","first-page":"195","DOI":"10.1186\/s12920-022-01355-0","volume":"15","author":"Y Liu","year":"2022","unstructured":"Liu Y, Bhagwate A, Winham SJ, Stephens MT, Harker BW, McDonough SJ, et al. Quality control recommendations for RNASeq using FFPE samples based on pre-sequencing lab metrics and post-sequencing bioinformatics metrics. BMC Med Genomics. 2022;15(1):195.","journal-title":"BMC Med Genomics"},{"issue":"3","key":"6298_CR50","doi-asserted-by":"publisher","first-page":"36","DOI":"10.1186\/1755-8794-3-36","volume":"9","author":"L Opitz","year":"2010","unstructured":"Opitz L, Salinas-Riester G, Grade M, Jung K, Jo P, Emons G, et al. Impact of RNA degradation on gene expression profiling. BMC Med Genomics. 2010;9(3):36.","journal-title":"BMC Med Genomics"},{"issue":"27","key":"6298_CR51","doi-asserted-by":"publisher","first-page":"7130","DOI":"10.1073\/pnas.1617384114","volume":"114","author":"AE Jaffe","year":"2017","unstructured":"Jaffe AE, Tao R, Norris AL, Kealhofer M, Nellore A, Shin JH, et al. qSVA framework for RNA quality correction in differential expression analysis. Proc Natl Acad Sci USA. 2017;114(27):7130\u20135.","journal-title":"Proc Natl Acad Sci USA"},{"issue":"17","key":"6298_CR52","doi-asserted-by":"publisher","first-page":"103","DOI":"10.1186\/s12859-016-0956-2","volume":"25","author":"CR Williams","year":"2016","unstructured":"Williams CR, Baccarella A, Parrish JZ, Kim CC. Trimming of sequence reads alters RNA-Seq gene expression estimates. BMC Bioinform. 2016;25(17):103.","journal-title":"BMC Bioinform"},{"issue":"10","key":"6298_CR53","doi-asserted-by":"publisher","DOI":"10.1093\/nar\/gks001","volume":"40","author":"Y Benjamini","year":"2012","unstructured":"Benjamini Y, Speed TP. Summarizing and correcting the GC content bias in high-throughput sequencing. Nucl Acids Res. 2012;40(10):e72.","journal-title":"Nucl Acids Res"},{"issue":"4","key":"6298_CR54","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pbio.1001046","volume":"9","author":"ENCODE Project Consortium","year":"2011","unstructured":"ENCODE Project Consortium. A user\u2019s guide to the encyclopedia of DNA elements (ENCODE). PLoS Biol. 2011;9(4):e1001046.","journal-title":"PLoS Biol"},{"key":"6298_CR55","doi-asserted-by":"publisher","unstructured":"Albrecht S, Sprang M, Andrade-Navarro MA, Fontaine J-F. seqQscorer: automated quality control of next-generation sequencing data using machine learning [Internet]. Vol. 22, Genome Biology. 2021. Available from: https:\/\/doi.org\/10.1186\/s13059-021-02294-2","DOI":"10.1186\/s13059-021-02294-2"},{"key":"6298_CR56","unstructured":"Bulk RNA-seq data standards and processing pipeline [Internet]. Accessed 30 Sept 2024s. Available from: https:\/\/www.encodeproject.org\/data-standards\/encode4-bulk-rna\/"},{"issue":"4","key":"6298_CR57","doi-asserted-by":"publisher","first-page":"595","DOI":"10.1002\/art.42380","volume":"75","author":"H-KM Makinde","year":"2023","unstructured":"Makinde H-KM, Dunn JLM, Gadhvi G, Carns M, Aren K, Chung AH, et al. Three distinct transcriptional profiles of monocytes associate with disease activity in Scleroderma patients. Arthritis Rheumatol. 2023;75(4):595\u2013608.","journal-title":"Arthritis Rheumatol"},{"issue":"6","key":"6298_CR58","doi-asserted-by":"publisher","first-page":"841","DOI":"10.1002\/art.40453","volume":"70","author":"AM Mandelin 2nd","year":"2018","unstructured":"Mandelin AM 2nd, Homan PJ, Shaffer AM, Cuda CM, Dominguez ST, Bacalao E, et al. Transcriptional profiling of synovial macrophages using minimally invasive ultrasound-guided synovial biopsies in rheumatoid arthritis. Arthritis Rheumatol. 2018;70(6):841\u201354.","journal-title":"Arthritis Rheumatol"},{"key":"6298_CR59","unstructured":"BBMap [Internet]. SourceForge. 2022. Accessed 25 Oct 2023. Available from: https:\/\/sourceforge.net\/projects\/bbmap\/"},{"issue":"16","key":"6298_CR60","doi-asserted-by":"publisher","first-page":"2078","DOI":"10.1093\/bioinformatics\/btp352","volume":"25","author":"H Li","year":"2009","unstructured":"Li H, Handsaker B, Wysoker A, Fennell T, Ruan J, Homer N, et al. The sequence alignment\/map format and SAMtools. Bioinformatics. 2009;25(16):2078\u20139.","journal-title":"Bioinformatics"},{"key":"6298_CR61","unstructured":"BroadInstitute. Picard [Internet]. http:\/\/picard.sourceforge.net. 2024. Accessed 5 June 2025. Available from: http:\/\/picard.sourceforge.net"},{"issue":"4","key":"6298_CR62","doi-asserted-by":"publisher","first-page":"576","DOI":"10.1016\/j.molcel.2010.05.004","volume":"38","author":"S Heinz","year":"2010","unstructured":"Heinz S, Benner C, Spann N, Bertolino E, Lin YC, Laslo P, et al. Simple combinations of lineage-determining transcription factors prime cis-regulatory elements required for macrophage and B cell identities. Mol Cell. 2010;38(4):576\u201389.","journal-title":"Mol Cell"},{"key":"6298_CR63","doi-asserted-by":"crossref","unstructured":"Irizarry RA. Ggplot2. In: Introduction to data science. Boca Raton: Chapman and Hall\/CRC; 2024. p. 107\u201325.","DOI":"10.1201\/9781003220923-8"},{"key":"6298_CR64","unstructured":"Larsson J. Eulerr: Area-proportional Euler diagrams with ellipses. 2018; Available from: https:\/\/lup.lub.lu.se\/student-papers\/record\/8934042\/file\/8935805.pdf"},{"issue":"6","key":"6298_CR65","doi-asserted-by":"publisher","first-page":"371","DOI":"10.1255\/jnirs.752","volume":"15","author":"M Kaihara","year":"2007","unstructured":"Kaihara M, Kikuchi S. Discriminant analysis of countries growing wakame seaweeds: a preliminary comparison of visible-near infrared spectra using soft independent modelling, Randomforests and classification and regression trees. J Near Infrared Spectrosc. 2007;15(6):371\u20137.","journal-title":"J Near Infrared Spectrosc"},{"issue":"20","key":"6298_CR66","doi-asserted-by":"publisher","first-page":"3940","DOI":"10.1093\/bioinformatics\/bti623","volume":"21","author":"T Sing","year":"2005","unstructured":"Sing T, Sander O, Beerenwinkel N, Lengauer T. ROCR: visualizing classifier performance in R. Bioinformatics. 2005;21(20):3940\u20131.","journal-title":"Bioinformatics"},{"key":"6298_CR67","unstructured":"Breiman L, Cutler A, Liaw A, Wiener M. randomForest [Internet]. CRAN. 2024. Accessed 19 June 2025. Available from: https:\/\/cran.r-project.org\/web\/packages\/randomForest\/index.html"},{"issue":"4","key":"6298_CR68","doi-asserted-by":"publisher","first-page":"1059","DOI":"10.1111\/rssb.12377","volume":"82","author":"DW Apley","year":"2020","unstructured":"Apley DW, Zhu J. Visualizing the effects of predictor variables in black box supervised learning models. J R Stat Soc Ser B Stat Methodol. 2020;82(4):1059\u201386.","journal-title":"J R Stat Soc Ser B Stat Methodol"},{"key":"6298_CR69","unstructured":"Apley D, Zhu J. ALEPlot [Internet]. GitHub. 2020. Accessed 19 June 2025. Available from: https:\/\/github.com\/cran\/ALEPlot"},{"issue":"5","key":"6298_CR70","doi-asserted-by":"publisher","first-page":"284","DOI":"10.1089\/omi.2011.0118","volume":"16","author":"G Yu","year":"2012","unstructured":"Yu G, Wang L-G, Han Y, He Q-Y. clusterProfiler: an R package for comparing biological themes among gene clusters. OMICS. 2012;16(5):284\u20137.","journal-title":"OMICS"}],"container-title":["BMC Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/article\/10.1186\/s12859-025-06298-8","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s12859-025-06298-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s12859-025-06298-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,6]],"date-time":"2026-03-06T12:03:38Z","timestamp":1772798618000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1186\/s12859-025-06298-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,1,27]]},"references-count":70,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2026,12]]}},"alternative-id":["6298"],"URL":"https:\/\/doi.org\/10.1186\/s12859-025-06298-8","relation":{"has-preprint":[{"id-type":"doi","id":"10.21203\/rs.3.rs-6976695\/v1","asserted-by":"object"}]},"ISSN":["1471-2105"],"issn-type":[{"value":"1471-2105","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,1,27]]},"assertion":[{"value":"25 June 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 October 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 January 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"This study involved secondary analysis of publicly available and fully de-identified data; therefore, ethics approval and consent to participate were not required.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval and consent to participate"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}},{"value":"The authors declare no competing interests.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"59"}}