{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,26]],"date-time":"2026-02-26T16:03:36Z","timestamp":1772121816920,"version":"3.50.1"},"reference-count":34,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2024,10,14]],"date-time":"2024-10-14T00:00:00Z","timestamp":1728864000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2024,10,14]],"date-time":"2024-10-14T00:00:00Z","timestamp":1728864000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["BMC Bioinformatics"],"DOI":"10.1186\/s12859-024-05955-8","type":"journal-article","created":{"date-parts":[[2024,10,14]],"date-time":"2024-10-14T13:02:00Z","timestamp":1728910920000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":6,"title":["DNASimCLR: a contrastive learning-based deep learning approach for gene sequence data classification"],"prefix":"10.1186","volume":"25","author":[{"given":"Minghao","family":"Yang","sequence":"first","affiliation":[]},{"given":"Zehua","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Zizhuo","family":"Yan","sequence":"additional","affiliation":[]},{"given":"Wenxiang","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Qian","family":"Zhu","sequence":"additional","affiliation":[]},{"given":"Changlong","family":"Jin","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,10,14]]},"reference":[{"key":"5955_CR1","doi-asserted-by":"publisher","first-page":"102539","DOI":"10.1016\/j.bspc.2021.102539","volume":"67","author":"KM Alt\u0131n","year":"2021","unstructured":"Alt\u0131n KM, Nalbantogl OU. Taxonomic classification of metage-nomic sequences from relative abundance index profiles using deep learning. Biomed Signal Process Control. 2021;67:102539.","journal-title":"Biomed Signal Process Control"},{"key":"5955_CR2","doi-asserted-by":"publisher","first-page":"403","DOI":"10.1016\/S0022-2836(05)80360-2","volume":"215","author":"SF Altschul","year":"1990","unstructured":"Altschul SF, Gish W, Miller W, Myers EW, Lipman DJ. Basic local alignment search tool. J Mol Biol. 1990;215:403\u201310.","journal-title":"J Mol Biol."},{"issue":"Suppl 7","key":"5955_CR3","first-page":"61","volume":"19","author":"F Antonino","year":"2018","unstructured":"Antonino F, Laura LP, Massimo LR, Giosu\u00e8 LB, Giovanni R, Riccardo R, Salvatore G, Alfonso U. Deep learning models for bacteria taxonomic classification of metagenomic data. BMC Bioinform. 2018;19(Suppl 7):61\u201376.","journal-title":"BMC Bioinform."},{"issue":"8","key":"5955_CR4","doi-asserted-by":"publisher","first-page":"14820","DOI":"10.1111\/jeb.13099","volume":"30","author":"SJE Baird","year":"2017","unstructured":"Baird SJE. The impact of high-throughput sequencing technology on speciation research: maintaining perspective. J Evolut Biol. 2017;30(8):14820\u201370.","journal-title":"J Evolut Biol."},{"issue":"1","key":"5955_CR5","doi-asserted-by":"publisher","first-page":"lqab004","DOI":"10.1093\/nargab\/lqab004","volume":"3","author":"JM Bartoszewicz","year":"2021","unstructured":"Bartoszewicz JM, Seidel A, Renard BY. Interpretable detection of novel human viruses from genome sequencing data. NAR Genom Bioinform. 2021;3(1):lqab004.","journal-title":"NAR Genom Bioinform."},{"key":"5955_CR6","unstructured":"Benjamin E., Tianjun Z., Ruslan S., Sergey L. Contrastive Learning as Goal-Conditioned Reinforcement Learning. Conference on Neural Information Processing Systems (2022)"},{"key":"5955_CR7","doi-asserted-by":"publisher","first-page":"262","DOI":"10.1186\/1471-2105-15-262","volume":"15","author":"AL Byrd","year":"2014","unstructured":"Byrd AL, Perez-Rogers JF, Manimaran S, Castro-Nallar E, Toma I, McCaffrey T, Siegel M, Benson G, Crandall KA, Johnson WE. Clinical pathoscope: rapid alignment and filtration for accurate pathogen identification in clinical samples using unassembled sequencing data. BMC Bioinform. 2014;15:262.","journal-title":"BMC Bioinform"},{"key":"5955_CR8","unstructured":"Chen T., Simon K., Mohammad N., Geoffrey H. A simple framework for contrastive learning of visual representations. International Conference on Machine Learning. PMLR. 2020."},{"key":"5955_CR9","first-page":"22243","volume":"33","author":"T Chen","year":"2020","unstructured":"Chen T, Simon K, Kevin S, Mohammad N, Geoffrey H. Big self-supervised models are strong semi-supervised learners. Conf Neural Inform Process Syst. 2020;33:22243\u201355.","journal-title":"Conf Neural Inform Process Syst"},{"key":"5955_CR10","first-page":"04297","volume":"9","author":"X Chen","year":"2020","unstructured":"Chen X, Fan H, Girshick R, He K. Improved baselines with momentum contrastive learning. Learning. 2020;9:04297.","journal-title":"Learning"},{"key":"5955_CR11","first-page":"9620","volume":"57","author":"X Chen","year":"2021","unstructured":"Chen X, Xie S, He K. An empirical study of training self-supervised vision transformers. IEEE Int Conf Comput Vis. 2021;57:9620\u20139.","journal-title":"IEEE Int Conf Comput Vis."},{"issue":"3","key":"5955_CR12","doi-asserted-by":"publisher","first-page":"318","DOI":"10.1093\/bioinformatics\/btaa705","volume":"37","author":"M Florian","year":"2021","unstructured":"Florian M, Adrian V, Emanuel B, Manja M. Vidhop, viral host prediction with deep learning. Bioinformatics. 2021;37(3):318\u201325.","journal-title":"Bioinformatics"},{"key":"5955_CR13","unstructured":"Florian M., Fleming K., Anton K., Sebastian B., Manja M.: BERTax: Taxonomic Classification of DNA Sequences with Deep Neural Networks (2021)"},{"issue":"7","key":"5955_CR14","doi-asserted-by":"publisher","first-page":"389","DOI":"10.1038\/s41576-019-0122-6","volume":"20","author":"E G\u00f6kcen","year":"2019","unstructured":"G\u00f6kcen E, \u017diga A, Julien G, Fabian JT. Deep learning: new computational modelling techniques for genomics. Nat Rev Genet. 2019;20(7):389\u2013403.","journal-title":"Nat Rev Genet."},{"issue":"Pt 2","key":"5955_CR15","first-page":"155915","volume":"838","author":"C Gargi","year":"2022","unstructured":"Gargi C, Sangeeta N, Supratim B, Joel F, Anthonia O, Pratyoosh S, et al. Microbiome systems biology advancements for natural well-being. Sci Total Environ. 2022;838(Pt 2):155915.","journal-title":"Sci Total Environ."},{"key":"5955_CR16","first-page":"21271","volume":"33","author":"J Grill","year":"2020","unstructured":"Grill J, Strub F, Altch\u00e9 F, Tallec C, Richemond PH, Buchatskaya E, et al. Bootstrap your own latent - a new approach to self-supervised learning. Conf Neural Inform Process Syst. 2020;33:21271\u201384.","journal-title":"Conf Neural Inform Process Syst."},{"key":"5955_CR17","first-page":"1","volume":"4","author":"L Haifeng","year":"2023","unstructured":"Haifeng L, Jun C, Jiawei Z, Qinyao L, Silu H, Xuyin W. Augmentation-free graph contrastive learning of invariant-discriminative representations. IEEE Trans Neural Netw Learn Syst. 2023;4:1\u201311.","journal-title":"IEEE Trans Neural Netw Learn Syst."},{"issue":"1","key":"5955_CR18","first-page":"9726","volume":"2020","author":"H Kaiming","year":"2020","unstructured":"Kaiming H, Haoqi F, Yuxin W, Saining X, Ross G. Momentum contrast for unsupervised visual representation learning. Comput Vis Patt Recogn. 2020;2020(1):9726\u201335.","journal-title":"Comput Vis Patt Recogn."},{"issue":"1","key":"5955_CR19","first-page":"770","volume":"03385","author":"H Kaiming","year":"2016","unstructured":"Kaiming H, Xiangyu Z, Shaoqing R, Jian S. Deep residual learning for image recognition. Proc IEEE Comput Soc Conf Comput Vis Patt Recogn. 2016;03385(1):770\u20138.","journal-title":"Proc IEEE Comput Soc Conf Comput Vis Patt Recogn."},{"key":"5955_CR20","first-page":"656","volume":"12","author":"WJ Kent","year":"2002","unstructured":"Kent WJ. Blat-the blast-like alignment tool. Genome Res. 2002;12:656\u201364.","journal-title":"Genome Res."},{"key":"5955_CR21","first-page":"18661","volume":"11362","author":"P Khosla","year":"2020","unstructured":"Khosla P, Teterwak P, Wang C, Sarna A, Tian Y, Isola P, et al. Supervised contrastive learning. Conf Neural Inform Process Syst. 2020;11362:18661\u201373.","journal-title":"Conf Neural Inform Process Syst."},{"key":"5955_CR22","doi-asserted-by":"publisher","first-page":"R25","DOI":"10.1186\/gb-2009-10-3-r25","volume":"10","author":"B Langmead","year":"2009","unstructured":"Langmead B, Trapnell C, Pop M, Salzberg SL. Ultrafast and memory-efficient alignment of short dna sequences to the human genome. Genome Biol. 2009;10:R25.","journal-title":"Genome Biol."},{"key":"5955_CR23","doi-asserted-by":"publisher","first-page":"589","DOI":"10.1093\/bioinformatics\/btp698","volume":"26","author":"H Li","year":"2010","unstructured":"Li H, Durbin R. Fast and accurate long-read alignment with burrows-wheeler transform. Bioinformatics. 2010;26:589\u201395.","journal-title":"Bioinformatics"},{"issue":"1","key":"5955_CR24","doi-asserted-by":"publisher","first-page":"lqaa009","DOI":"10.1093\/nargab\/lqaa009","volume":"2","author":"Q Liang","year":"2020","unstructured":"Liang Q, Wang PB, Liu Y, Zou B, Lai W. Deepmicrobes: taxo-nomic classification for metagenomics with deep learning. NAR Genom Bioinform. 2020;2(1):lqaa009.","journal-title":"NAR Genom Bioinform."},{"key":"5955_CR25","first-page":"537795","volume":"15","author":"R Mateo","year":"2019","unstructured":"Mateo R, Ilya OT, Guillermo L, Nicholas Y, Ruth L, Bernhard S. GeNet: deep representations for metagenomics. Comput Res Repos. 2019;15:537795\u201313.","journal-title":"Comput Res Repos."},{"key":"5955_CR26","first-page":"544","volume":"95","author":"C Mengru","year":"2023","unstructured":"Mengru C, Chao H, Lianghao X, Wei W, Yong X, Ronghua L. Heterogeneous graph contrastive learning for recommendation. WSDM. 2023;95:544\u201352.","journal-title":"WSDM"},{"issue":"9","key":"5955_CR27","doi-asserted-by":"publisher","first-page":"833","DOI":"10.1038\/nbt.3935","volume":"35","author":"C Quince","year":"2017","unstructured":"Quince C, Walker AW, Simpson JT, et al. Shotgun metagenomics, from sampling to analysis. Nat Biotechnol. 2017;35(9):833.","journal-title":"Nat Biotechnol."},{"key":"5955_CR28","doi-asserted-by":"publisher","first-page":"64","DOI":"10.1007\/s40484-019-0187-4","volume":"8","author":"J Ren","year":"2020","unstructured":"Ren J, Song K, Deng C, Ahlgren NA, Fuhrman JA, Li Y, Xie X, Poplin R, Sun F. Identifying viruses from metagenomic data by deep learning. Quantit Biol. 2020;8:64\u201377.","journal-title":"Quantit. Biol."},{"issue":"2","key":"5955_CR29","doi-asserted-by":"publisher","first-page":"546","DOI":"10.1093\/bioinformatics\/btab607","volume":"38","author":"RA Stanton","year":"2022","unstructured":"Stanton RA, Vlachos N, Laufer HA. GAMMA: a tool for the rapid identification, classification and annotation of translated gene matches from sequencing data. Bioinformatics. 2022;38(2):546\u20138.","journal-title":"Bioinformatics"},{"key":"5955_CR30","doi-asserted-by":"publisher","first-page":"e0222271","DOI":"10.1371\/journal.pone.0222271","volume":"14","author":"A Tampuu","year":"2019","unstructured":"Tampuu A, Bzhalava Z, Dillner J, Vicente R. ViraMiner: deep learning on raw DNA sequences for identifying viral genomes in human samples. PLoS ONE. 2019;14:e0222271.","journal-title":"PLoS ONE"},{"issue":"17","key":"5955_CR31","first-page":"2722","volume":"37","author":"L Wang","year":"2021","unstructured":"Wang L, \u015eenay K, Jun C, Nicholas JD, Jesper T, Robert H. Deepviral: prediction of novel virus-host interactions from protein sequences and infectious disease phenotypes. Intell Syst Mol Biol. 2021;37(17):2722\u20139.","journal-title":"Intell Syst Mol Biol."},{"issue":"1","key":"5955_CR32","doi-asserted-by":"publisher","first-page":"85","DOI":"10.1093\/bib\/bbw005","volume":"18","author":"M Wei","year":"2017","unstructured":"Wei M, Lu Z, Pan Z, Chuanbo H, Jianwei L, Bin G, Jichun Y, Wei K, Xuezhong Z, Qinghua C. An analysis of human microbe-disease associations. Brief Bioinform. 2017;18(1):85\u201397.","journal-title":"Brief Bioinform."},{"issue":"6","key":"5955_CR33","first-page":"18","volume":"3","author":"Y Xiaoyuan","year":"2018","unstructured":"Xiaoyuan Y, Kai M, Yuxia Z, Lihong Q, Wu A, Youling W. Establishment and Application of Rapid Diagnosis for Reverse Transcription-Quantitative PCR of Newly Emerging GooseOrigin Nephrotic Astrovirus in China. mSphere. 2018;3(6):18.","journal-title":"mSphere"},{"key":"5955_CR34","first-page":"678","volume":"3","author":"W Yunzhan","year":"2023","unstructured":"Yunzhan W, Jin Y, Yunpeng C. VirusBERTHP: Improved Virus Host Prediction Via Attention-based Pre-trained Model Using Viral Genomic Sequences. IEEE Int Conf Bioinform Biomed. 2023;3:678\u201383.","journal-title":"IEEE Int Conf Bioinform Biomed."}],"container-title":["BMC Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s12859-024-05955-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1186\/s12859-024-05955-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s12859-024-05955-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,14]],"date-time":"2024-10-14T13:02:08Z","timestamp":1728910928000},"score":1,"resource":{"primary":{"URL":"https:\/\/bmcbioinformatics.biomedcentral.com\/articles\/10.1186\/s12859-024-05955-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,10,14]]},"references-count":34,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2024,12]]}},"alternative-id":["5955"],"URL":"https:\/\/doi.org\/10.1186\/s12859-024-05955-8","relation":{},"ISSN":["1471-2105"],"issn-type":[{"value":"1471-2105","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,10,14]]},"assertion":[{"value":"29 February 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"9 October 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"14 October 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"Not applicable.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval and consent to participate"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}},{"value":"The authors declare no competing interests.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"328"}}