{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,29]],"date-time":"2026-03-29T01:14:29Z","timestamp":1774746869351,"version":"3.50.1"},"reference-count":27,"publisher":"Springer Science and Business Media LLC","issue":"1","funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["No. 91130008 and No.11201460"],"award-info":[{"award-number":["No. 91130008 and No.11201460"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"The Strategic Priority Research Program of the Chinese Academy of Sciences","award":["No. XDB13040600"],"award-info":[{"award-number":["No. XDB13040600"]}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["No. 11571349 and No. 11201460"],"award-info":[{"award-number":["No. 11571349 and No. 11201460"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100004739","name":"Youth Innovation Promotion Association of the Chinese Academy of Sciences","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100004739","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["BMC Bioinformatics"],"published-print":{"date-parts":[[2017,12]]},"DOI":"10.1186\/s12859-017-1743-4","type":"journal-article","created":{"date-parts":[[2017,7,11]],"date-time":"2017-07-11T09:32:47Z","timestamp":1499765567000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":11,"title":["Estimating Phred scores of Illumina base calls by logistic regression and sparse modeling"],"prefix":"10.1186","volume":"18","author":[{"given":"Sheng","family":"Zhang","sequence":"first","affiliation":[]},{"given":"Bo","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Lin","family":"Wan","sequence":"additional","affiliation":[]},{"given":"Lei M.","family":"Li","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2017,7,11]]},"reference":[{"key":"1743_CR1","doi-asserted-by":"crossref","first-page":"387","DOI":"10.1146\/annurev.genom.9.081307.164359","volume":"9","author":"ER Mardis","year":"2008","unstructured":"Mardis ER. Next-generation dna sequencing methods. Annu Rev Genomics Hum Genet. 2008; 9:387\u2013402.","journal-title":"Annu Rev Genomics Hum Genet"},{"issue":"3","key":"1743_CR2","doi-asserted-by":"crossref","first-page":"186","DOI":"10.1101\/gr.8.3.186","volume":"8","author":"B Ewing","year":"1998","unstructured":"Ewing B, Green P. Base-calling of automated sequencer traces using Phred. ii. error probabilities. Genome Res. 1998; 8(3):186\u201394.","journal-title":"Genome Res"},{"issue":"1","key":"1743_CR3","doi-asserted-by":"crossref","first-page":"57","DOI":"10.1038\/nmeth.2276","volume":"10","author":"NA Bokulich","year":"2013","unstructured":"Bokulich NA, Subramanian S, Faith JJ, Gevers D, Gordon JI, Knight RT, Mills DA, Caporaso JG. Quality-filtering vastly improves diversity estimates from Illumina amplicon sequencing. Nat Methods. 2013; 10(1):57\u20139.","journal-title":"Nat Methods"},{"key":"1743_CR4","unstructured":"HCS 1.4\/RTA 1.12 Theory of Operation. Illumina Inc. http:\/\/www.illumina.com\/Documents\/products\/technotes\/technote_rta_theory_operations.pdf . Accessed 20 July 2016."},{"key":"1743_CR5","doi-asserted-by":"crossref","first-page":"41348","DOI":"10.1038\/srep41348","volume":"7","author":"B Wang","year":"2017","unstructured":"Wang B, Wan L, Wang A, Li LM. An adaptive decorrelation method removes Illumina DNA base-calling errors caused by crosstalk between adjacent clusters. Sci Rep. 2017; 7:41348.","journal-title":"Sci Rep"},{"key":"1743_CR6","volume-title":"Applied Logistic Regression","author":"DW Hosmer Jr","year":"2004","unstructured":"Hosmer Jr DW, Lemeshow S. Applied Logistic Regression. Hoboken: Wiley; 2004."},{"key":"1743_CR7","doi-asserted-by":"crossref","DOI":"10.1007\/978-1-4899-3242-6","volume-title":"Generalized Linear Models. vol. 37.","author":"P Mccullagh","year":"1989","unstructured":"Mccullagh P, Nelder JA. Generalized Linear Models. vol. 37. 2nd ed. London: Chapman and Hall; 1989."},{"issue":"4","key":"1743_CR8","doi-asserted-by":"crossref","first-page":"531","DOI":"10.1137\/1037125","volume":"37","author":"TJ Ypma","year":"1995","unstructured":"Ypma TJ. Historical development of the Newton-Raphson method. SIAM Rev. 1995; 37(4):531\u201351.","journal-title":"SIAM Rev"},{"issue":"16","key":"1743_CR9","doi-asserted-by":"crossref","first-page":"105","DOI":"10.1093\/nar\/gkn425","volume":"36","author":"JC Dohm","year":"2008","unstructured":"Dohm JC, Lottaz C, Borodina T, Himmelbauer H. Substantial biases in ultra-short read data sets from high-throughput dna sequencing. Nucleic Acids Res. 2008; 36(16):105.","journal-title":"Nucleic Acids Res"},{"issue":"11","key":"1743_CR10","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1186\/gb-2011-12-11-r112","volume":"12","author":"AE Minoche","year":"2011","unstructured":"Minoche AE, Dohm JC, Himmelbauer H. Evaluation of genomic high-throughput sequencing data generated on Illumina hiseq and genome analyzer systems. Genome Biol. 2011; 12(11):1\u201315.","journal-title":"Genome Biol"},{"key":"1743_CR11","doi-asserted-by":"crossref","DOI":"10.1201\/b17758","volume-title":"Sparse Modeling: Theory, Algorithms, and Applications","author":"I Rish","year":"2014","unstructured":"Rish I, Grabarnik G. Sparse Modeling: Theory, Algorithms, and Applications. Beaverton: CRC Press, Inc; 2014."},{"issue":"1","key":"1743_CR12","doi-asserted-by":"crossref","first-page":"27","DOI":"10.1007\/BF01666516","volume":"2","author":"H An","year":"1985","unstructured":"An H, Gu L. On the selection of regression variables. Acta Math Applicatae Sin. 1985; 2(1):27\u201336.","journal-title":"Acta Math Applicatae Sin"},{"key":"1743_CR13","first-page":"583","volume":"7","author":"A Chakrabarti","year":"2011","unstructured":"Chakrabarti A, Ghosh JK. AIC, BIC, and recent advances in model selection. Handbook of the philosophy of science. 2011; 7:583\u2013605.","journal-title":"Handbook of the philosophy of science"},{"key":"1743_CR14","doi-asserted-by":"crossref","first-page":"267","DOI":"10.1111\/j.2517-6161.1996.tb02080.x","volume":"58","author":"RJ Tibshirani","year":"1996","unstructured":"Tibshirani RJ. Regression shrinkage and selection via the lasso. J R Stat Soc. 1996; 58:267\u201388.","journal-title":"J R Stat Soc"},{"issue":"1","key":"1743_CR15","doi-asserted-by":"crossref","first-page":"1","DOI":"10.18637\/jss.v033.i01","volume":"33","author":"J Friedman","year":"2010","unstructured":"Friedman J, Hastie T, Tibshirani R. Regularization paths for generalized linear models via coordinate descent. J Stat Softw. 2010; 33(1):1\u201322.","journal-title":"J Stat Softw"},{"issue":"17","key":"1743_CR16","doi-asserted-by":"crossref","first-page":"5183","DOI":"10.1093\/nar\/gkh850","volume":"32","author":"M Li","year":"2004","unstructured":"Li M, Nordborg M, Li LM. Adjust quality scores from alignment and improve sequencing accuracy. Nucleic Acids Res. 2004; 32(17):5183\u201391.","journal-title":"Nucleic Acids Res"},{"issue":"13","key":"1743_CR17","doi-asserted-by":"crossref","first-page":"5541","DOI":"10.1021\/jp951507c","volume":"100","author":"CAM Seidel","year":"1996","unstructured":"Seidel CAM, And AS, Sauer MHM. Nucleobase-specific quenching of fluorescent dyes. 1. nucleobase one-electron redox potentials and their correlation with static and dynamic quenching efficiencies. J Phys Chem. 1996; 100(13):5541\u201353.","journal-title":"J Phys Chem"},{"issue":"9","key":"1743_CR18","doi-asserted-by":"crossref","first-page":"1214","DOI":"10.1093\/bioinformatics\/btu010","volume":"30","author":"C Ye","year":"2014","unstructured":"Ye C, Hsiao C, Corrada BH. Blindcall: ultra-fast base-calling of high-throughput sequencing data by blind deconvolution. Bioinformatics. 2014; 30(9):1214\u20139.","journal-title":"Bioinformatics"},{"key":"1743_CR19","unstructured":"Bravo HC. Research Webpage. http:\/\/www.cbcb.umd.edu\/%7Ehcorrada\/secgen . Accessed 20 July 2016."},{"key":"1743_CR20","volume-title":"R: A Language and Environment for Statistical Computing","author":"R Core Team","year":"2017","unstructured":"R Core Team. R: A Language and Environment for Statistical Computing. Vienna: R Foundation for Statistical Computing; 2017. R Foundation for Statistical Computing. https:\/\/www.R-project.org\/ ."},{"key":"1743_CR21","volume-title":"Statistics","author":"JT Mcclave","year":"2000","unstructured":"Mcclave JT, Sincich T. Statistics, 8th, annotat instructor\u2019s edn. Upper Saddler River: Prentice Hall; 2000."},{"issue":"2","key":"1743_CR22","doi-asserted-by":"crossref","first-page":"301","DOI":"10.1111\/j.1467-9868.2005.00503.x","volume":"67","author":"H Zou","year":"2005","unstructured":"Zou H, Hastie T. Regularization and variable selection via the elastic net. J R Stat Soc Ser B Stat Methodol. 2005; 67(2):301\u201320.","journal-title":"J R Stat Soc Ser B Stat Methodol"},{"issue":"12","key":"1743_CR23","first-page":"1871","volume":"9","author":"RE Fan","year":"2010","unstructured":"Fan RE, Chang KW, Hsieh CJ, Wang XR, Lin CJ. Liblinear: A library for large linear classification. J Mach Learn Res. 2010; 9(12):1871\u20134.","journal-title":"J Mach Learn Res"},{"issue":"1","key":"1743_CR24","doi-asserted-by":"crossref","first-page":"29","DOI":"10.1148\/radiology.143.1.7063747","volume":"143","author":"JA Hanley","year":"1982","unstructured":"Hanley JA, Mcneil BJ. The meaning and use of the area under a receiver operating characteristic (roc) curve. Radiology. 1982; 143(1):29\u201336.","journal-title":"Radiology"},{"issue":"9","key":"1743_CR25","doi-asserted-by":"crossref","first-page":"1297","DOI":"10.1101\/gr.107524.110","volume":"20","author":"A McKenna","year":"2010","unstructured":"McKenna A, Hanna M, Banks E, Sivachenko A, Cibulskis K, Kernytsky A, Garimella K, Altshuler D, Gabriel S, Daly M, DePristo MA. The Genome Analysis Toolkit: A MapReduce framework for analyzing next-generation DNA sequencing data. Genome Res. 2010; 20(9):1297\u2013303.","journal-title":"Genome Res"},{"issue":"16","key":"1743_CR26","doi-asserted-by":"crossref","first-page":"2078","DOI":"10.1093\/bioinformatics\/btp352","volume":"25","author":"H Li","year":"2009","unstructured":"Li H, Handsaker B, Wysoker A, Fennell T, Ruan J, Homer N, Marth G, Abecasis G, Durbin R. The Sequence Alignment\/Map format and SAMtools. Bioinformatics. 2009; 25(16):2078\u201379.","journal-title":"Bioinformatics"},{"issue":"12","key":"1743_CR27","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1371\/journal.pone.0085024","volume":"8","author":"C Del Fabbro","year":"2013","unstructured":"Del Fabbro C, Scalabrin S, Morgante M, Giorgi FM. An extensive evaluation of read trimming effects on illumina NGS data analysis. PLoS ONE. 2013; 8(12):1\u201313.","journal-title":"PLoS ONE"}],"container-title":["BMC Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s12859-017-1743-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,6,25]],"date-time":"2024-06-25T10:42:30Z","timestamp":1719312150000},"score":1,"resource":{"primary":{"URL":"http:\/\/bmcbioinformatics.biomedcentral.com\/articles\/10.1186\/s12859-017-1743-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,7,11]]},"references-count":27,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2017,12]]}},"alternative-id":["1743"],"URL":"https:\/\/doi.org\/10.1186\/s12859-017-1743-4","relation":{},"ISSN":["1471-2105"],"issn-type":[{"value":"1471-2105","type":"electronic"}],"subject":[],"published":{"date-parts":[[2017,7,11]]},"article-number":"335"}}