{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,28]],"date-time":"2025-03-28T10:05:10Z","timestamp":1743156310009,"version":"3.40.3"},"publisher-location":"Cham","reference-count":36,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783030792893"},{"type":"electronic","value":"9783030792909"}],"license":[{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021]]},"DOI":"10.1007\/978-3-030-79290-9_11","type":"book-chapter","created":{"date-parts":[[2021,7,2]],"date-time":"2021-07-02T14:03:32Z","timestamp":1625234612000},"page":"127-141","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":9,"title":["Clustering Based Identification of SARS-CoV-2 Subtypes"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-3943-0839","authenticated-orcid":false,"given":"Andrew","family":"Melnyk","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1395-1051","authenticated-orcid":false,"given":"Fatemeh","family":"Mohebbi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0385-1831","authenticated-orcid":false,"given":"Sergey","family":"Knyazev","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6481-2583","authenticated-orcid":false,"given":"Bikram","family":"Sahoo","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0747-8245","authenticated-orcid":false,"given":"Roya","family":"Hosseini","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4007-5624","authenticated-orcid":false,"given":"Pavel","family":"Skums","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4424-4691","authenticated-orcid":false,"given":"Alex","family":"Zelikovsky","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4329-0234","authenticated-orcid":false,"given":"Murray","family":"Patterson","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2021,7,3]]},"reference":[{"key":"11_CR1","unstructured":"EMBL-EBI: Wellcome Genome Campus, Hinxton, Cambridgeshire"},{"key":"11_CR2","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"353","DOI":"10.1007\/978-3-319-56970-3_22","volume-title":"Research in Computational Molecular Biology","author":"S Ahn","year":"2017","unstructured":"Ahn, S., Vikalo, H.: aBayesQR: a Bayesian method for reconstruction of viral populations characterized by low diversity. In: Sahinalp, S.C. (ed.) RECOMB 2017. LNCS, vol. 10229, pp. 353\u2013369. Springer, Cham (2017). https:\/\/doi.org\/10.1007\/978-3-319-56970-3_22"},{"key":"11_CR3","volume-title":"Cluster Analysis for Applications","author":"M Anderberg","year":"1973","unstructured":"Anderberg, M.: Cluster Analysis for Applications. Academic Press, Cambridge (1973)"},{"issue":"5","key":"11_CR4","doi-asserted-by":"publisher","first-page":"835","DOI":"10.1101\/gr.215038.116","volume":"27","author":"JA Baaijens","year":"2017","unstructured":"Baaijens, J.A., El Aabidine, A.Z., Rivals, E., Sch\u00f6nhuth, A.: De novo assembly of viral quasispecies using overlap graphs. Genome Res. 27(5), 835\u2013848 (2017)","journal-title":"Genome Res."},{"issue":"8","key":"11_CR5","doi-asserted-by":"publisher","first-page":"e2017521","DOI":"10.1001\/jamanetworkopen.2020.17521","volume":"3","author":"Q Bukhari","year":"2020","unstructured":"Bukhari, Q., Jameel, Y., Massaro, J., D\u2019Agostino, R., Khan, S.: Periodic oscillations in daily reported infections and deaths for coronavirus disease 2019. JAMA Netw. Open 3(8), e2017521 (2020). https:\/\/doi.org\/10.1001\/jamanetworkopen.2020.17521","journal-title":"JAMA Netw. Open"},{"issue":"1","key":"11_CR6","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1080\/03610927408827101","volume":"3","author":"T Cali\u0144ski","year":"1974","unstructured":"Cali\u0144ski, T., Harabasz, J.: A dendrite method for cluster analysis. Commun. Stat. 3(1), 1\u201327 (1974). https:\/\/doi.org\/10.1080\/03610927408827101","journal-title":"Commun. Stat."},{"key":"11_CR7","doi-asserted-by":"publisher","unstructured":"Ciccolella, S., Patterson, M., Bonizzoni, P., Vedova, G.D.: Effective clustering for single cell sequencing cancer data. In: The 10th ACM International Conference on Bioinformatics, Computational Biology and Health Informatics, ACM-BCB, Niagara Falls, NY, USA, pp. 437\u2013446. ACM (2019). https:\/\/doi.org\/10.1145\/3307339.3342149","DOI":"10.1145\/3307339.3342149"},{"issue":"3","key":"11_CR8","doi-asserted-by":"publisher","first-page":"326","DOI":"10.1093\/bioinformatics\/btaa722","volume":"37","author":"S Ciccolella","year":"2020","unstructured":"Ciccolella, S., et al.: Inferring cancer progression from single-cell sequencing while allowing mutation losses. Bioinformatics 37(3), 326\u2013333 (2020). https:\/\/doi.org\/10.1093\/bioinformatics\/btaa722","journal-title":"Bioinformatics"},{"key":"11_CR9","doi-asserted-by":"publisher","unstructured":"Ciccolella, S., Soto, M., Patterson, M.D., Vedova, G.D., Hajirasouliha, I., Bonizzoni, P.: gpps: an ILP-based approach for inferring cancer progression with mutation losses from single cell data. BMC Bioinform. 21 (2020). Article number: 413. https:\/\/doi.org\/10.1186\/s12859-020-03736-7","DOI":"10.1186\/s12859-020-03736-7"},{"key":"11_CR10","doi-asserted-by":"crossref","unstructured":"The COVID-19 Genomics UK (COG-UK) Consortium: An integrated national scale SARS-CoV-2 genomic surveillance network. Lancet Microbe 1(3), 99\u2013100 (2020)","DOI":"10.1016\/S2666-5247(20)30054-9"},{"key":"11_CR11","doi-asserted-by":"publisher","unstructured":"Davies, D.L., Bouldin, D.W.: A cluster separation measure. IEEE Trans. Pattern Anal. Mach. Intell. PAMI-1(2), 224\u2013227 (1979). https:\/\/doi.org\/10.1109\/TPAMI.1979.4766909","DOI":"10.1109\/TPAMI.1979.4766909"},{"key":"11_CR12","doi-asserted-by":"publisher","first-page":"33","DOI":"10.1002\/gch2.1018","volume":"1","author":"S Elbe","year":"2017","unstructured":"Elbe, S., Buckland-Merrett, G.: Data, disease and diplomacy: GISAID\u2019s innovative contribution to global health. Glob. Chall. 1, 33\u201346 (2017). https:\/\/doi.org\/10.1002\/gch2.1018","journal-title":"Glob. Chall."},{"key":"11_CR13","unstructured":"Public Health England: Investigation of novel SARS-CoV-2 variant: variant of concern 202012\/01. Technical briefing 1 (2021)"},{"issue":"23","key":"11_CR14","doi-asserted-by":"publisher","first-page":"4121","DOI":"10.1093\/bioinformatics\/bty407","volume":"34","author":"J Hadfield","year":"2018","unstructured":"Hadfield, J., et al.: Nextstrain: real-time tracking of pathogen evolution. Bioinformatics 34(23), 4121\u20134123 (2018). https:\/\/doi.org\/10.1093\/bioinformatics\/bty407","journal-title":"Bioinformatics"},{"key":"11_CR15","unstructured":"Huang, Z.: A fast clustering algorithm to cluster very large categorical data sets in data mining. In: The SIGMOD Workshop on Research Issues on Data Mining and Knowledge Discovery, pp. 1\u20138 (1997)"},{"issue":"3","key":"11_CR16","doi-asserted-by":"publisher","first-page":"283","DOI":"10.1023\/A:1009769707641","volume":"2","author":"Z Huang","year":"1998","unstructured":"Huang, Z.: Extensions to the k-means algorithm for clustering large data sets with categorical values. Data Min. Knowl. Discov. 2(3), 283\u2013304 (1998). https:\/\/doi.org\/10.1023\/A:1009769707641","journal-title":"Data Min. Knowl. Discov."},{"key":"11_CR17","doi-asserted-by":"publisher","unstructured":"Jahn, K., Kuipers, J., Beerenwinkel, N.: Tree inference for single-cell data. Genome Biol. 17(1) (2016). Article number: 86. https:\/\/doi.org\/10.1186\/s13059-016-0936-x","DOI":"10.1186\/s13059-016-0936-x"},{"key":"11_CR18","doi-asserted-by":"publisher","unstructured":"James, B., Luczak, B., Girgis, H.: MeShClust: an intelligent tool for clustering DNA sequences. Nucleic Acid Res. 46(14) (2018). https:\/\/doi.org\/10.1093\/nar\/gky315","DOI":"10.1093\/nar\/gky315"},{"key":"11_CR19","doi-asserted-by":"publisher","unstructured":"Kammonen, J.I., et al.: gapFinisher: a reliable gap filling pipeline for SSPACE-LongRead scaffolder output (2019). https:\/\/doi.org\/10.1371\/journal.pone.0216885","DOI":"10.1371\/journal.pone.0216885"},{"key":"11_CR20","doi-asserted-by":"publisher","unstructured":"Knyazev, S., Hughes, L., Skums, P., Zelikovsky, A.: Epidemiological data analysis of viral quasispecies in the next-generation sequencing era. Brief. Bioinform. (2020). https:\/\/doi.org\/10.1093\/bib\/bbaa101","DOI":"10.1093\/bib\/bbaa101"},{"key":"11_CR21","doi-asserted-by":"publisher","unstructured":"Knyazev, S., et al.: CliqueSNV: scalable reconstruction of intra-host viral populations from NGS reads. bioRxiv (2018). https:\/\/doi.org\/10.1101\/264242","DOI":"10.1101\/264242"},{"key":"11_CR22","doi-asserted-by":"publisher","unstructured":"Li, T., Ma, S., Ogihara, M.: Entropy-based criterion in categorical clustering. In: Twenty-First International Conference on Machine Learning (2004). https:\/\/doi.org\/10.1145\/1015330.1015404","DOI":"10.1145\/1015330.1015404"},{"key":"11_CR23","unstructured":"McQueen, J.: Some methods for classification and analysis of multivariate observations. In: The 5th Berkely Symposium on Mathematical Statistics and Probability, pp. 281\u2013297 (1967)"},{"key":"11_CR24","doi-asserted-by":"publisher","DOI":"10.1126\/science.abf2946","author":"L du Plessis","year":"2021","unstructured":"du Plessis, L., et al.: Establishment and lineage dynamics of the SARS-CoV-2 epidemic in the UK. Science (2021). https:\/\/doi.org\/10.1126\/science.abf2946","journal-title":"Science"},{"issue":"1","key":"11_CR25","doi-asserted-by":"publisher","first-page":"182","DOI":"10.1109\/TCBB.2013.145","volume":"11","author":"S Prabhakaran","year":"2014","unstructured":"Prabhakaran, S., Rey, M., Zagordi, O., Beerenwinkel, N., Roth, V.: HIV haplotype inference using a propagating Dirichlet process mixture model. IEEE\/ACM Trans. Comput. Biol. Bioinform. (TCBB) 11(1), 182\u2013191 (2014)","journal-title":"IEEE\/ACM Trans. Comput. Biol. Bioinform. (TCBB)"},{"key":"11_CR26","doi-asserted-by":"publisher","first-page":"53","DOI":"10.1016\/0377-0427(87)90125-7","volume":"20","author":"PJ Rousseeuw","year":"1987","unstructured":"Rousseeuw, P.J.: Silhouettes: a graphical aid to the interpretation and validation of cluster analysis. J. Comput. Appl. Math. 20, 53\u201365 (1987). https:\/\/doi.org\/10.1016\/0377-0427(87)90125-7","journal-title":"J. Comput. Appl. Math."},{"issue":"20","key":"11_CR27","doi-asserted-by":"publisher","first-page":"6097","DOI":"10.1093\/nar\/18.20.6097","volume":"18","author":"TD Schneider","year":"1990","unstructured":"Schneider, T.D., Stephens, R.: Sequence logos: a new way to display consensus sequences. Nucleic Acids Res. 18(20), 6097\u20136100 (1990). https:\/\/doi.org\/10.1093\/nar\/18.20.6097","journal-title":"Nucleic Acids Res."},{"issue":"5","key":"11_CR28","first-page":"263","volume":"11","author":"P Skums","year":"2011","unstructured":"Skums, P., Campo, D.S., Dimitrova, Z., Vaughan, G., Lau, D.T., Khudyakov, Y.: Numerical detection, measuring and analysis of differential interferon resistance for individual HCV intra-host variants and its influence on the therapy response. Silico Biol. 11(5), 263\u2013269 (2011)","journal-title":"Silico Biol."},{"key":"11_CR29","doi-asserted-by":"publisher","unstructured":"Skums, P., Kirpich, A., Baykal, P.I., Zelikovsky, A., Chowell, G.: Global transmission network of SARS-CoV-2: from outbreak to pandemic. medRxiv (2020). https:\/\/doi.org\/10.1101\/2020.03.22.20041145","DOI":"10.1101\/2020.03.22.20041145"},{"issue":"3","key":"11_CR30","first-page":"512","volume":"10","author":"K Tamura","year":"1993","unstructured":"Tamura, K., Nei, M.: Estimation of the number of nucleotide substitutions in the control region of mitochondrial DNA in humans and chimpanzees. Mol. Biol. Evol. 10(3), 512\u2013526 (1993)","journal-title":"Mol. Biol. Evol."},{"issue":"2","key":"11_CR31","doi-asserted-by":"publisher","first-page":"411","DOI":"10.1111\/1467-9868.00293","volume":"63","author":"R Tibshirani","year":"2001","unstructured":"Tibshirani, R., Walther, G., Hastie, T.: Estimating the number of clusters in a data set via the gap statistic. J. Roy. Stat. Soc. 63(2), 411\u2013423 (2001)","journal-title":"J. Roy. Stat. Soc."},{"key":"11_CR32","doi-asserted-by":"publisher","unstructured":"Volz, E., et al.: Transmission of SARS-CoV-2 lineage b.1.1.7 in England: insights from linking epidemiological and genetic data. medRxiv (2021). https:\/\/doi.org\/10.1101\/2020.12.30.20249034","DOI":"10.1101\/2020.12.30.20249034"},{"issue":"1","key":"11_CR33","doi-asserted-by":"publisher","first-page":"355","DOI":"10.1186\/s12859-015-0791-x","volume":"16","author":"I Vrbik","year":"2015","unstructured":"Vrbik, I., Stephens, D.A., Roger, M., Brenner, B.G.: The Gap Procedure: for the identification of phylogenetic clusters in HIV-1 sequence data. BMC Bioinform. 16(1), 355 (2015). https:\/\/doi.org\/10.1186\/s12859-015-0791-x","journal-title":"BMC Bioinform."},{"key":"11_CR34","unstructured":"W.H.O.: update, December 2020"},{"issue":"7798","key":"11_CR35","doi-asserted-by":"publisher","first-page":"265","DOI":"10.1038\/s41586-020-2008-3","volume":"579","author":"F Wu","year":"2020","unstructured":"Wu, F., et al.: A new coronavirus associated with human respiratory disease in China. Nature 579(7798), 265\u2013269 (2020). https:\/\/doi.org\/10.1038\/s41586-020-2008-3","journal-title":"Nature"},{"issue":"7798","key":"11_CR36","doi-asserted-by":"publisher","first-page":"270","DOI":"10.1038\/s41586-020-2012-7","volume":"579","author":"P Zhou","year":"2020","unstructured":"Zhou, P., et al.: A pneumonia outbreak associated with a new coronavirus of probable bat origin. Nature 579(7798), 270\u2013273 (2020). https:\/\/doi.org\/10.1038\/s41586-020-2012-7","journal-title":"Nature"}],"container-title":["Lecture Notes in Computer Science","Computational Advances in Bio and Medical Sciences"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-79290-9_11","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,7,2]],"date-time":"2021-07-02T14:04:48Z","timestamp":1625234688000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-030-79290-9_11"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021]]},"ISBN":["9783030792893","9783030792909"],"references-count":36,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-79290-9_11","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2021]]},"assertion":[{"value":"3 July 2021","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ICCABS","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Computational Advances in Bio and Medical Sciences","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2020","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"10 December 2020","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"12 December 2020","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"10","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"iccabs2020","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/iccabs.engr.uconn.edu\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}