{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2023,5,18]],"date-time":"2023-05-18T04:38:27Z","timestamp":1684384707642},"reference-count":33,"publisher":"Springer Science and Business Media LLC","issue":"12","license":[{"start":{"date-parts":[[2023,3,29]],"date-time":"2023-03-29T00:00:00Z","timestamp":1680048000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,3,29]],"date-time":"2023-03-29T00:00:00Z","timestamp":1680048000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Soft Comput"],"published-print":{"date-parts":[[2023,6]]},"DOI":"10.1007\/s00500-023-08049-4","type":"journal-article","created":{"date-parts":[[2023,3,29]],"date-time":"2023-03-29T10:06:22Z","timestamp":1680084382000},"page":"7813-7829","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Heuristic normalization procedure for batch effect correction"],"prefix":"10.1007","volume":"27","author":[{"given":"Arthur","family":"Yosef","sequence":"first","affiliation":[]},{"given":"Eli","family":"Shnaider","sequence":"additional","affiliation":[]},{"given":"Moti","family":"Schneider","sequence":"additional","affiliation":[]},{"given":"Michael","family":"Gurevich","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,3,29]]},"reference":[{"key":"8049_CR1","doi-asserted-by":"publisher","first-page":"10101","DOI":"10.1073\/pnas.97.18.10101","volume":"97","author":"O Alter","year":"2000","unstructured":"Alter O, Brown PO, Botstein D (2000) Singular value decomposition for genome-wide expression data processing and modeling. Proc Natl Acad Sci USA 97:10101\u201310106","journal-title":"Proc Natl Acad Sci USA"},{"key":"8049_CR2","first-page":"120","volume-title":"The analysis of gene expression data: methods and software","author":"LC And","year":"2003","unstructured":"And LC, Wong WH (2003) Dna-Chip analyzer (Dchip). In: Parmigiani G, Garrett ES, Irizarry R, AndZeger SL (eds) The analysis of gene expression data: methods and software. Springer, New York, pp 120\u2013141"},{"issue":"1","key":"8049_CR3","doi-asserted-by":"publisher","first-page":"105","DOI":"10.1093\/bioinformatics\/btg385","volume":"20","author":"M Benito","year":"2004","unstructured":"Benito M, Parker J, Du Q, Wu J, Xiang D, Perou CM, Marron JS (2004) Adjustment of systematic microarray data biases. Bioinformatics 20(1):105\u2013114. https:\/\/doi.org\/10.1093\/bioinformatics\/btg385","journal-title":"Bioinformatics"},{"key":"8049_CR4","doi-asserted-by":"publisher","DOI":"10.3389\/fgene.2014.00354","author":"OD Buhule","year":"2014","unstructured":"Buhule OD, Minster RL, Hawley NL, Medvedovic M, Sun G, Viali S, Deka R, Mcgarvey S, Weeks DE (2014) Stratified randomization controls better for batch effects in 450 K methylation analysis: a cautionary tale. Front Genet. https:\/\/doi.org\/10.3389\/fgene.2014.00354","journal-title":"Front Genet"},{"issue":"2","key":"8049_CR5","doi-asserted-by":"publisher","first-page":"e17238","DOI":"10.1371\/journal.pone.0017238","volume":"6","author":"C Chen","year":"2011","unstructured":"Chen C, Grennan K, Badner J, Zhang D, Gershon E, Jin L, Liu C (2011) Removing batch effects in analysis of expression microarray data: an evaluation of six batch adjustment methods. PLoS ONE 6(2):e17238. https:\/\/doi.org\/10.1371\/journal.pone.0017238","journal-title":"PLoS ONE"},{"key":"8049_CR6","doi-asserted-by":"publisher","first-page":"18898","DOI":"10.1038\/srep18898","volume":"6","author":"L Cheng","year":"2016","unstructured":"Cheng L, Lo L-Y, Tang NLS, Wang D, Leung K-S (2016) CrossNorm: a novel normalization strategy for microarray data in cancers. Sci Rep 6:18898. https:\/\/doi.org\/10.1038\/srep18898","journal-title":"Sci Rep"},{"key":"8049_CR7","doi-asserted-by":"publisher","first-page":"569","DOI":"10.1016\/j.tig.2013.05.010","volume":"29","author":"E Eisenberg","year":"2013","unstructured":"Eisenberg E, Levanon EY (2013) Human housekeeping genes, revisited. Trends Genet 29:569\u2013574","journal-title":"Trends Genet"},{"key":"8049_CR8","doi-asserted-by":"publisher","first-page":"539","DOI":"10.1093\/biostatistics\/kxr034","volume":"13","author":"JA Gagnon-Bartsch","year":"2012","unstructured":"Gagnon-Bartsch JA, Speed TP (2012) Using control genes to correct for unwanted variation in microarray data. Biostatistics 13:539\u2013552","journal-title":"Biostatistics"},{"issue":"S2","key":"8049_CR9","doi-asserted-by":"publisher","first-page":"142","DOI":"10.1186\/s12864-017-3490-3","volume":"18","author":"GWW Goh","year":"2017","unstructured":"Goh GWW, Wong L (2017) Protein complex-based analysis is resistant to the obfuscating consequences of batch effects\u2014a case study in clinical proteomics. BMC Genom 18(S2):142. https:\/\/doi.org\/10.1186\/s12864-017-3490-3","journal-title":"BMC Genom"},{"issue":"6","key":"8049_CR10","doi-asserted-by":"publisher","first-page":"1052","DOI":"10.1158\/1055-9965.EPI-13-0114","volume":"22","author":"KN Harper","year":"2013","unstructured":"Harper KN, Peters BA, Gamble MV (2013) Batch effects and pathway analysis: two potential perils in cancer studies involving DNA methylation array analysis. Cancer Epidemiol Biomark Prev 22(6):1052\u20131060","journal-title":"Cancer Epidemiol Biomark Prev"},{"issue":"1","key":"8049_CR11","doi-asserted-by":"publisher","first-page":"16","DOI":"10.1093\/biostatistics\/kxv026","volume":"17","author":"L Jacob","year":"2016","unstructured":"Jacob L, Gagnon-Bartsch JA, Speed TP (2016) Correcting gene expression data when neither the unwanted variation nor the factor of interest are observed. Biostatistics 17(1):16\u201328. https:\/\/doi.org\/10.1093\/biostatistics\/kxv026","journal-title":"Biostatistics"},{"key":"8049_CR12","doi-asserted-by":"publisher","first-page":"118","DOI":"10.1093\/biostatistics\/kxj037","volume":"8","author":"WE Johnson","year":"2007","unstructured":"Johnson WE, Li C, Rabinovic A (2007) Adjusting batch effects in microarray expression data using empirical Bayes methods. Biostatistics 8:118\u2013127","journal-title":"Biostatistics"},{"key":"8049_CR13","doi-asserted-by":"publisher","first-page":"1724","DOI":"10.1371\/journal.pgen.0030161","volume":"3","author":"JT Leek","year":"2007","unstructured":"Leek JT, Storey JD (2007) Capturing heterogeneity in gene expression studies by surrogate variable analysis. PLoS Genet 3:1724\u20131735","journal-title":"PLoS Genet"},{"issue":"6","key":"8049_CR14","doi-asserted-by":"publisher","first-page":"882","DOI":"10.1093\/bioinformatics\/bts034","volume":"28","author":"JT Leek","year":"2012","unstructured":"Leek JT, Johnson E, Parker HS, Jaffe A, Storey J (2012) The SVA package for removing batch effects and other unwanted variation in high-throughput experiments. Bioinformatics 28(6):882\u2013883. https:\/\/doi.org\/10.1093\/bioinformatics\/bts034","journal-title":"Bioinformatics"},{"key":"8049_CR15","unstructured":"Leek JT, Johnson WE, Parker HS, Fertig EJ, Jaffe AE, Zhang Y, Storey JD, Torres LC (2019) SVA\u2014surrogate variable analysis. Bioconductor Version: Release (3.9), pp 1\u201322"},{"key":"8049_CR16","doi-asserted-by":"publisher","first-page":"358","DOI":"10.3389\/fbioe.2019.00358","volume":"7","author":"X Liu","year":"2019","unstructured":"Liu X, Li N, Liu S, Wang J, Zhang N, Zheng X, Leung K-S, Cheng L (2019) Normalization methods for the analysis of unbalanced transcriptome data: a review. Front Bioeng Biotechnol 7:358. https:\/\/doi.org\/10.3389\/fbioe.2019.00358","journal-title":"Front Bioeng Biotechnol"},{"issue":"4","key":"8049_CR17","doi-asserted-by":"publisher","first-page":"278","DOI":"10.1038\/tpj.2010.57","volume":"10","author":"J Luo","year":"2010","unstructured":"Luo J, Schumacher M, Scherer A, Sanoudou D, Megherbi D, Davison T, Shi T, Tong W, Shi L, Hong H, Zhao C, Elloumi F, Shi W, Thomas R, Lin S, Tillinghast G, Liu G, Zhou Y, Herman D, Li Y, Deng Y, Fang H, Bushel P, Woods M, Zhang J (2010) A comparison of batch effect removal methods for enhancement of prediction performance using MAQC-II microarray gene expression data. Pharmacogenom J 10(4):278\u2013291. https:\/\/doi.org\/10.1038\/tpj.2010.57","journal-title":"Pharmacogenom J"},{"issue":"1","key":"8049_CR18","doi-asserted-by":"publisher","first-page":"100","DOI":"10.1093\/clinchem\/46.1.100","volume":"46","author":"RF Martin","year":"2000","unstructured":"Martin RF (2000) General deming regression for estimating systematic bias and its confidence interval in method-comparison studies. Clin Chem 46(1):100\u2013104","journal-title":"Clin Chem"},{"issue":"6","key":"8049_CR19","doi-asserted-by":"publisher","first-page":"0156594","DOI":"10.1371\/journal","volume":"11","author":"C M\u00fcller","year":"2016","unstructured":"M\u00fcller C, Schillert A, R\u00f6themeier C, Tr\u00e9gou\u00ebt DA, Proust C, Binder H, Pfeiffer N, Beutel M, Lackner KJ, Schnabel RB, Tiret L, Wild PS, Blankenberg S, Zeller T, Andreas Ziegler A (2016) Removing batch effects from longitudinal gene expression\u2014quantile normalization plus as best approach for microarray transcriptome data. PLoS ONE 11(6):0156594. https:\/\/doi.org\/10.1371\/journal","journal-title":"PLoS ONE"},{"issue":"9314","key":"8049_CR20","doi-asserted-by":"publisher","first-page":"1301","DOI":"10.1016\/S0140-6736(02)08270-3","volume":"359","author":"TO Nielsen","year":"2002","unstructured":"Nielsen TO, West RB, Linn SC, Alter O, Knowling MA, O\u2019connell JX, Zhu S, Fero M, Sherlock G, Pollack JR, Brown PO, Botstein D, Van de Rijn M (2002) Molecular characterisation of soft tissue tumours: a gene expression study. Lancet 359(9314):1301\u20131307. https:\/\/doi.org\/10.1016\/S0140-6736(02)08270-3","journal-title":"Lancet"},{"issue":"1","key":"8049_CR21","doi-asserted-by":"publisher","first-page":"29","DOI":"10.1093\/biostatistics\/kxv027","volume":"17","author":"V Nygaard","year":"2016","unstructured":"Nygaard V, R\u00f8dland EA, Hovig E (2016) Methods that remove batch effects while retaining group differences may lead to exaggerated confidence in downstream analyses. Biostatistics 17(1):29\u201339. https:\/\/doi.org\/10.1093\/biostatistics\/kxv027","journal-title":"Biostatistics"},{"issue":"19","key":"8049_CR22","doi-asserted-by":"publisher","first-page":"2757","DOI":"10.1093\/bioinformatics\/btu375","volume":"30","author":"HS Parker","year":"2014","unstructured":"Parker HS, Leek JT, Favorov AV, Considine M, Xia X, Chavan S, Chung CH, Fertig EJ (2014) Preserving biological heterogeneity with a permuted surrogate variable analysis for genomics batch correction. Bioinformatics 30(19):2757\u20132763. https:\/\/doi.org\/10.1093\/bioinformatics\/btu375","journal-title":"Bioinformatics"},{"issue":"11","key":"8049_CR23","doi-asserted-by":"publisher","first-page":"709","DOI":"10.1515\/cclm.1983.21.11.709","volume":"21","author":"H Passing","year":"1983","unstructured":"Passing H, Bablok W (1983) A new biometrical procedure for testing the equality of measurements from two different analytical methods. Application of linear regression procedures for method comparison studies in clinical chemistry, Part I. J Clin Chem Clin Biochem Z Fur Klin Chem Und Klin Biochem 21(11):709\u2013720. https:\/\/doi.org\/10.1515\/cclm.1983.21.11.709","journal-title":"J Clin Chem Clin Biochem Z Fur Klin Chem Und Klin Biochem"},{"issue":"14","key":"8049_CR24","doi-asserted-by":"publisher","first-page":"2318","DOI":"10.1093\/bioinformatics\/btv157","volume":"31","author":"P Patil","year":"2015","unstructured":"Patil P, Bachant-Winner P-O, Haibe-Kains B, Leek JT (2015) Test set bias affects reproducibility of gene signatures. Bioinformatics 31(14):2318\u20132323. https:\/\/doi.org\/10.1093\/bioinformatics\/btv157","journal-title":"Bioinformatics"},{"key":"8049_CR25","doi-asserted-by":"publisher","first-page":"83","DOI":"10.3389\/fgene.2018.00083","volume":"9","author":"EM Price","year":"2018","unstructured":"Price EM, Robinson WP (2018) Adjusting for batch effects in DNA methylation microarray data, a lesson learned. Front Genet 9:83. https:\/\/doi.org\/10.3389\/fgene.2018.00083","journal-title":"Front Genet"},{"key":"8049_CR26","doi-asserted-by":"publisher","first-page":"42","DOI":"10.1186\/1755-8794-1-42","volume":"1","author":"AH Sims","year":"2008","unstructured":"Sims AH, Smethurst GJ, Hey Y, Okoniewski MJ, Pepper SD, Howell A, Miller CJ, Clarke RB (2008) The removal of multiplicative, systematic bias allows integration of breast cancer gene expression datasets - improving meta-analysis and prediction of prognosis. BMC Med Genom 1:42. https:\/\/doi.org\/10.1186\/1755-8794-1-42","journal-title":"BMC Med Genom"},{"key":"8049_CR27","doi-asserted-by":"publisher","first-page":"63","DOI":"10.1186\/s12859-015-0478-3","volume":"16","author":"CK Stein","year":"2015","unstructured":"Stein CK, Qu P, Epstein J, Buros A, Rosenthal A, Crowley J, Morgan G, Barlogie B (2015) Removing batch effects from purified plasma cell gene expression microarrays with modified. BMC Bioinform 16:63. https:\/\/doi.org\/10.1186\/s12859-015-0478-3","journal-title":"BMC Bioinform"},{"issue":"18","key":"8049_CR28","doi-asserted-by":"publisher","first-page":"3357","DOI":"10.1093\/bioinformatics\/btz066","volume":"35","author":"H Weishaupt","year":"2019","unstructured":"Weishaupt H, Johansson P, Sundstr\u00f6m A, Lubovac-Pilav Z, Olsson B, Nelander S, Swartling FJ (2019) Batch-normalization of cerebellar and medulloblastoma gene expression datasets utilizing empirically defined negative control genes. Bioinformatics 35(18):3357\u20133364","journal-title":"Bioinformatics"},{"issue":"9","key":"8049_CR29","doi-asserted-by":"publisher","first-page":"research0048","DOI":"10.1186\/gb-2002-3-9-research0048","volume":"3","author":"C Workman","year":"2002","unstructured":"Workman C, Jensen LJ, Jarmer H, Berka R, Gautier L, Nielser HB, Saxild H, Nielsen C, Brunak S, Knudsen S (2002) A new non-linear normalization method for reducing variability in DNA microarray experiments. Genome Biol 3(9):research0048","journal-title":"Genome Biol"},{"issue":"5","key":"8049_CR30","doi-asserted-by":"publisher","first-page":"2267","DOI":"10.1002\/int.22378","volume":"36","author":"A Yosef","year":"2021","unstructured":"Yosef A, Shnaider E, Schneider M (2021) New concepts of cluster construction and similarity measurement. Int J Intell Syst 36(5):2267\u20132291","journal-title":"Int J Intell Syst"},{"key":"8049_CR31","doi-asserted-by":"publisher","first-page":"262","DOI":"10.1186\/s12859-018-2263-6","volume":"19","author":"Y Zhang","year":"2018","unstructured":"Zhang Y, Jenkins DF, Manimaran S, Johnson E (2018) Alternative empirical Bayes models for adjusting for batch effects in genomic studies. BMC Bioinform 19:262. https:\/\/doi.org\/10.1186\/s12859-018-2263-6","journal-title":"BMC Bioinform"},{"issue":"9","key":"8049_CR32","doi-asserted-by":"publisher","first-page":"433","DOI":"10.1016\/j.jgg.2019.08.002","volume":"46","author":"L Zhou","year":"2019","unstructured":"Zhou L, Chi-Hau SA, Bin Goh WW (2019) Examining the practical limits of batch effect-correction algorithms: when should you care about batch effects? J Genet Genom 46(9):433\u2013443. https:\/\/doi.org\/10.1016\/j.jgg.2019.08.002","journal-title":"J Genet Genom"},{"key":"8049_CR33","doi-asserted-by":"publisher","first-page":"271","DOI":"10.1186\/s12859-020-03559-6","volume":"21","author":"T Zindler","year":"2020","unstructured":"Zindler T, Frieling H, Neyazi A, Bleich S, Friedel E (2020) Simulating ComBat: how batch correction can lead to the systematic introduction of false positive results in DNA methylation microarray studies. BMC Bioinform 21:271. https:\/\/doi.org\/10.1186\/s12859-020-03559-6","journal-title":"BMC Bioinform"}],"container-title":["Soft Computing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00500-023-08049-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00500-023-08049-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00500-023-08049-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,5,17]],"date-time":"2023-05-17T14:23:55Z","timestamp":1684333435000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00500-023-08049-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,3,29]]},"references-count":33,"journal-issue":{"issue":"12","published-print":{"date-parts":[[2023,6]]}},"alternative-id":["8049"],"URL":"https:\/\/doi.org\/10.1007\/s00500-023-08049-4","relation":{},"ISSN":["1432-7643","1433-7479"],"issn-type":[{"value":"1432-7643","type":"print"},{"value":"1433-7479","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,3,29]]},"assertion":[{"value":"13 March 2023","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"29 March 2023","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors have not disclosed any competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"This article does not contain any studies with human participants performed by any of the authors.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical approval"}}]}}