{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T05:17:16Z","timestamp":1755839836715,"version":"3.40.5"},"reference-count":48,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,5,9]],"date-time":"2025-05-09T00:00:00Z","timestamp":1746748800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2025,5,9]],"date-time":"2025-05-09T00:00:00Z","timestamp":1746748800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["BMC Bioinformatics"],"DOI":"10.1186\/s12859-025-06136-x","type":"journal-article","created":{"date-parts":[[2025,5,9]],"date-time":"2025-05-09T17:10:41Z","timestamp":1746810641000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["PCVR: a pre-trained contextualized visual representation for DNA sequence classification"],"prefix":"10.1186","volume":"26","author":[{"given":"Jiarui","family":"Zhou","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hui","family":"Wu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kang","family":"Du","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Wengang","family":"Zhou","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Cong-Zhao","family":"Zhou","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Houqiang","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,5,9]]},"reference":[{"issue":"6","key":"6136_CR1","doi-asserted-by":"publisher","first-page":"1322","DOI":"10.1109\/TCBB.2015.2403370","volume":"12","author":"K-O Cheng","year":"2015","unstructured":"Cheng K-O, Wu P, Law N-F, Siu W-C. Compression of multiple DNA sequences using intra-sequence and inter-sequence similarities. IEEE\/ACM Trans Comput Biol Bioinf. 2015;12(6):1322\u201332.","journal-title":"IEEE\/ACM Trans Comput Biol Bioinf"},{"issue":"22","key":"6136_CR2","doi-asserted-by":"publisher","first-page":"5019","DOI":"10.1093\/bioinformatics\/btac658","volume":"38","author":"Y Wei","year":"2022","unstructured":"Wei Y, Zou Q, Tang F, Yu L. WMSA: A novel method for multiple sequence alignment of DNA sequences. Bioinformatics. 2022;38(22):5019\u201325.","journal-title":"Bioinformatics"},{"issue":"17","key":"6136_CR3","doi-asserted-by":"publisher","first-page":"2899","DOI":"10.1093\/bioinformatics\/bty1050","volume":"35","author":"Z Zhuang","year":"2019","unstructured":"Zhuang Z, Shen X, Pan W. A simple convolutional neural network for prediction of enhancer-promoter interactions with DNA sequence data. Bioinformatics. 2019;35(17):2899\u2013906.","journal-title":"Bioinformatics"},{"issue":"1","key":"6136_CR4","doi-asserted-by":"publisher","first-page":"345","DOI":"10.1186\/s12859-023-05469-9","volume":"24","author":"J Zhang","year":"2023","unstructured":"Zhang J, Liu B, Wu J, Wang Z, Li J. DeepCAC: A deep learning approach on DNA transcription factors classification based on multi-head self-attention and concatenate convolutional neural network. BMC Bioinformatics. 2023;24(1):345.","journal-title":"BMC Bioinformatics"},{"issue":"3","key":"6136_CR5","doi-asserted-by":"publisher","first-page":"405","DOI":"10.1109\/TCBB.2024.3366240","volume":"21","author":"K Sheena","year":"2024","unstructured":"Sheena K, Nair MS. GenCoder: A novel convolutional neural network based autoencoder for genomic sequence data compression. IEEE\/ACM Trans Comput Biol Bioinf. 2024;21(3):405\u201315.","journal-title":"IEEE\/ACM Trans Comput Biol Bioinf"},{"issue":"3","key":"6136_CR6","doi-asserted-by":"publisher","first-page":"403","DOI":"10.1016\/S0022-2836(05)80360-2","volume":"215","author":"SF Altschul","year":"1990","unstructured":"Altschul SF, Gish W, Miller W, Myers EW, Lipman DJ. Basic local alignment search tool. J Mol Biol. 1990;215(3):403\u201310.","journal-title":"J Mol Biol"},{"issue":"11","key":"6136_CR7","doi-asserted-by":"publisher","first-page":"1026","DOI":"10.1038\/nbt.3988","volume":"35","author":"M Steinegger","year":"2017","unstructured":"Steinegger M, S\u00f6ding J. MMseqs2 enables sensitive protein sequence searching for the analysis of massive data sets. Nat Biotechnol. 2017;35(11):1026\u20138.","journal-title":"Nat Biotechnol"},{"issue":"18","key":"6136_CR8","doi-asserted-by":"publisher","first-page":"3094","DOI":"10.1093\/bioinformatics\/bty191","volume":"34","author":"H Li","year":"2018","unstructured":"Li H. Minimap2: Pairwise alignment for nucleotide sequences. Bioinformatics. 2018;34(18):3094\u2013100.","journal-title":"Bioinformatics"},{"key":"6136_CR9","doi-asserted-by":"publisher","DOI":"10.7717\/peerj.7359","volume":"7","author":"DD Kang","year":"2019","unstructured":"Kang DD, Li F, Kirton E, Thomas A, Egan R, An H, Wang Z. MetaBAT 2: An adaptive binning algorithm for robust and efficient genome reconstruction from metagenome assemblies. PeerJ. 2019;7: e7359.","journal-title":"PeerJ"},{"issue":"4","key":"6136_CR10","doi-asserted-by":"publisher","first-page":"779","DOI":"10.1016\/j.cell.2019.07.010","volume":"178","author":"SH Ye","year":"2019","unstructured":"Ye SH, Siddle KJ, Park DJ, Sabeti PC. Benchmarking metagenomics tools for taxonomic classification. Cell. 2019;178(4):779\u201394.","journal-title":"Cell"},{"key":"6136_CR11","doi-asserted-by":"publisher","first-page":"603","DOI":"10.7717\/peerj.603","volume":"2","author":"M Imelfort","year":"2014","unstructured":"Imelfort M, Parks D, Woodcroft BJ, Dennis P, Hugenholtz P, Tyson GW. GroopM: An automated tool for the recovery of population genomes from related metagenomes. PeerJ. 2014;2:603.","journal-title":"PeerJ"},{"key":"6136_CR12","doi-asserted-by":"publisher","first-page":"836","DOI":"10.1038\/s41564-018-0171-1","volume":"3","author":"C Sieber","year":"2018","unstructured":"Sieber C, Probst A, Sharrar A, Thomas B, Hess M, Tringe S, Banfield J. Recovery of genomes from metagenomes via a dereplication, aggregation and scoring strategy. Nat Microbiol. 2018;3:836\u201343.","journal-title":"Nat Microbiol"},{"issue":"C","key":"6136_CR13","doi-asserted-by":"publisher","DOI":"10.1016\/j.compbiolchem.2022.107765","volume":"101","author":"C Shen","year":"2022","unstructured":"Shen C, Chen Y, Xiao F, Yang T, Wang X, Chen S, Tang J, Liao Z. BAT-Net: An enhanced RNA secondary structure prediction via bidirectional GRU-based network with attention mechanism. Comput Biol Chem. 2022;101(C): 107765.","journal-title":"Comput Biol Chem"},{"issue":"4","key":"6136_CR14","doi-asserted-by":"publisher","first-page":"1937","DOI":"10.1109\/JBHI.2023.3286917","volume":"28","author":"C Shen","year":"2024","unstructured":"Shen C, Mao D, Tang J, Liao Z, Chen S. Prediction of lncRNA-protein interactions based on kernel combinations and graph convolutional networks. IEEE J Biomed Health Inform. 2024;28(4):1937\u201348.","journal-title":"IEEE J Biomed Health Inform"},{"key":"6136_CR15","doi-asserted-by":"crossref","unstructured":"Akkaya UM, Kalkan H. Classification of DNA sequences with k-mers based vector representations. In: Innovations in Intelligent Systems and Applications Conference. 2021;pp. 1\u20135","DOI":"10.1109\/ASYU52992.2021.9599084"},{"issue":"1","key":"6136_CR16","first-page":"1835056","volume":"2021","author":"H Gunasekaran","year":"2021","unstructured":"Gunasekaran H, Ramalakshmi K, Rex Macedo Arokiaraj A, Deepa Kanmani S, Venkatesan C, Suresh Gnana Dhas C. Analysis of DNA sequence classification using CNN and hybrid models. Comput Math Methods Med. 2021;2021(1):1835056.","journal-title":"Comput Math Methods Med"},{"issue":"2","key":"6136_CR17","doi-asserted-by":"publisher","first-page":"888","DOI":"10.1109\/TCBB.2020.3017191","volume":"19","author":"H Bae","year":"2020","unstructured":"Bae H, Min S, Choi H-S, Yoon S. DNA Privacy: Analyzing malicious DNA sequences using deep neural networks. IEEE\/ACM Trans Comput Biol Bioinf. 2020;19(2):888\u201398.","journal-title":"IEEE\/ACM Trans Comput Biol Bioinf"},{"issue":"10","key":"6136_CR18","doi-asserted-by":"publisher","first-page":"1130","DOI":"10.2174\/1574893615666200224095531","volume":"15","author":"Z Du","year":"2021","unstructured":"Du Z, Xiao X, Uversky VN. Classification of chromosomal DNA sequences using hybrid deep learning architectures. Curr Bioinform. 2021;15(10):1130\u20136.","journal-title":"Curr Bioinform"},{"key":"6136_CR19","doi-asserted-by":"crossref","unstructured":"Rizzo R, Fiannaca A, La\u00a0Rosa M, Urso A. Classification experiments of DNA sequences by using a deep neural network and chaos game representation. In: Proceedings of the International Conference on Computer Systems and Technologies. 2016;pp. 222\u2013228","DOI":"10.1145\/2983468.2983489"},{"issue":"4","key":"6136_CR20","doi-asserted-by":"publisher","first-page":"493","DOI":"10.1080\/15257770.2019.1645851","volume":"39","author":"SM Abd-Alhalem","year":"2020","unstructured":"Abd-Alhalem SM, Soliman NF, Eldin S, Abd Elrahman SE, Ismail NA. El-Rabaie E-SM, El-Samie FEA, Bacterial classification with convolutional neural networks based on different data reduction layers. Nucleosides, Nucleotides & Nucleic Acids. 2020;39(4):493\u2013503.","journal-title":"Nucleosides, Nucleotides & Nucleic Acids."},{"issue":"1","key":"6136_CR21","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1371\/journal.pone.0261531","volume":"17","author":"P Mill\u00e1n Arias","year":"2022","unstructured":"Mill\u00e1n Arias P, Alipour F, Hill KA, Kari L. DeLUCS: Deep learning for unsupervised clustering of DNA sequences. PLoS ONE. 2022;17(1):1\u201325.","journal-title":"PLoS ONE"},{"issue":"12","key":"6136_CR22","doi-asserted-by":"publisher","first-page":"10466","DOI":"10.1109\/TPAMI.2024.3443141","volume":"46","author":"M Jin","year":"2024","unstructured":"Jin M, Koh HY, Wen Q, Zambon D, Alippi C, Webb GI, King I, Pan S. A survey on graph neural networks for time series: Forecasting, classification, imputation, and anomaly detection. IEEE Trans Pattern Anal Mach Intell. 2024;46(12):10466\u201385.","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"6136_CR23","first-page":"6000","volume":"30","author":"A Vaswani","year":"2017","unstructured":"Vaswani A, Shazeer N, Parmar N, Uszkoreit J, Jones L, Gomez AN, Kaiser \u0141, Polosukhin I. Attention is all you need. Proceedings of the International Conference on Neural Information Processing Systems. 2017;30:6000\u201310.","journal-title":"Proceedings of the International Conference on Neural Information Processing Systems"},{"key":"6136_CR24","unstructured":"Dosovitskiy A, Beyer L, Kolesnikov A, Weissenborn D, Zhai X, Unterthiner T, Dehghani M, Minderer M, Heigold G, Gelly S, Uszkoreit J, Houlsby N. An image is worth 16x16 words: Transformers for image recognition at scale. In: Proceedings of the International Conference on Learning Representations. 2021;pp. 1\u201321"},{"key":"6136_CR25","doi-asserted-by":"crossref","unstructured":"Zhang C, Zhang M, Zhang S, Jin D, Zhou Q, Cai Z, Zhao H, Liu X, Liu Z. Delving deep into the generalization of vision transformers under distribution shifts. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 2022;pp. 7277\u20137286","DOI":"10.1109\/CVPR52688.2022.00713"},{"key":"6136_CR26","unstructured":"Kenton JDM-WC, Toutanova LK. BERT: Pre-training of deep bidirectional transformers for language understanding. In: Proceedings of Annual Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies. 2019;pp. 4171\u20134186"},{"key":"6136_CR27","doi-asserted-by":"crossref","unstructured":"He K, Chen X, Xie S, Li Y, Doll\u00e1r P, Girshick R. Masked autoencoders are scalable vision learners. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 2022;pp. 16000\u201316009","DOI":"10.1109\/CVPR52688.2022.01553"},{"issue":"1","key":"6136_CR28","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s12859-020-03667-3","volume":"21","author":"Y Yue","year":"2020","unstructured":"Yue Y, Huang H, Qi Z, Dou H-M, Liu X-Y, Han T-F, Chen Y, Song X-J, Zhang Y-H, Tu J. Evaluating metagenomics tools for genome binning with real metagenomic datasets and CAMI datasets. BMC Bioinformatics. 2020;21(1):1\u201315.","journal-title":"BMC Bioinformatics"},{"issue":"18","key":"6136_CR29","doi-asserted-by":"publisher","first-page":"3029","DOI":"10.1093\/bioinformatics\/btab184","volume":"37","author":"M Mirdita","year":"2021","unstructured":"Mirdita M, Steinegger M, Breitwieser F, S\u00f6ding J, Levy Karin E. Fast and sensitive taxonomic assignment to metagenomic contigs. Bioinformatics. 2021;37(18):3029\u201331.","journal-title":"Bioinformatics"},{"key":"6136_CR30","doi-asserted-by":"crossref","unstructured":"Mangkunegara IS, Purwono P. Analysis of DNA sequence classification using SVM model with hyperparameter tuning grid search CV. In: Proceedings of the IEEE International Conference on Cybernetics and Computational Intelligence. 2022;pp. 427\u2013432","DOI":"10.1109\/CyberneticsCom55287.2022.9865624"},{"key":"6136_CR31","unstructured":"Habib MA, Manik MMH. Classification of DNA sequence using machine learning techniques. 2022;pp. 1\u20135"},{"issue":"1","key":"6136_CR32","doi-asserted-by":"publisher","first-page":"009","DOI":"10.1093\/nargab\/lqaa009","volume":"2","author":"Q Liang","year":"2020","unstructured":"Liang Q, Bible PW, Liu Y, Zou B, Wei L. DeepMicrobes: Taxonomic classification for metagenomics with deep learning. NAR Genomics and Bioinformatics. 2020;2(1):009.","journal-title":"NAR Genomics and Bioinformatics"},{"issue":"1","key":"6136_CR33","doi-asserted-by":"publisher","first-page":"092","DOI":"10.1093\/bioadv\/vbad092","volume":"3","author":"W Fuhl","year":"2023","unstructured":"Fuhl W, Zabel S, Nieselt K. Improving taxonomic classification with feature space balancing. Bioinformatics Advances. 2023;3(1):092.","journal-title":"Bioinformatics Advances"},{"key":"6136_CR34","unstructured":"Mikolov T, Chen K, Corrado GS, Dean J. Efficient estimation of word representations in vector space. In: Proceedings of the International Conference on Learning Representations. 2013;pp. 1\u201312"},{"key":"6136_CR35","doi-asserted-by":"crossref","unstructured":"Pennington J, Socher R, Manning CD. Glove: Global vectors for word representation. In: Proceedings of the Conference on Empirical Methods in Natural Language Processing. 2014;pp. 1532\u20131543","DOI":"10.3115\/v1\/D14-1162"},{"key":"6136_CR36","doi-asserted-by":"crossref","unstructured":"Peters ME, Neumann M, Iyyer M, Gardner M, Clark C, Lee K, Zettlemoyer L. Deep contextualized word representations. In: Proceedings of the Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies. 2018;pp. 2227\u20132237","DOI":"10.18653\/v1\/N18-1202"},{"issue":"8","key":"6136_CR37","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","volume":"9","author":"S Hochreiter","year":"1997","unstructured":"Hochreiter S, Schmidhuber J. Long short-term memory. Neural Comput. 1997;9(8):1735\u201380.","journal-title":"Neural Comput"},{"key":"6136_CR38","unstructured":"Radford A, Narasimhan K, Salimans T, Sutskever I, et al. Improving language understanding by generative pre-training. 2018;1\u201312"},{"issue":"35","key":"6136_CR39","doi-asserted-by":"publisher","first-page":"2122636119","DOI":"10.1073\/pnas.2122636119","volume":"119","author":"F Mock","year":"2022","unstructured":"Mock F, Kretschmer F, Kriese A, B\u00f6cker S, Marz M. Taxonomic classification of DNA sequences beyond sequence similarity using deep neural networks. Proc Natl Acad Sci. 2022;119(35):2122636119.","journal-title":"Proc Natl Acad Sci"},{"key":"6136_CR40","doi-asserted-by":"crossref","unstructured":"Deng J, Dong W, Socher R, Li L-J, Li K, Fei-Fei L. ImageNet: A large-scale hierarchical image database. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 2009;pp. 248\u2013255","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"6136_CR41","doi-asserted-by":"crossref","unstructured":"He K, Zhang X, Ren S, Sun J. Deep residual learning for image recognition. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 2016;pp. 770\u2013778","DOI":"10.1109\/CVPR.2016.90"},{"issue":"5","key":"6136_CR42","doi-asserted-by":"publisher","first-page":"429","DOI":"10.1093\/bioinformatics\/17.5.429","volume":"17","author":"JS Almeida","year":"2001","unstructured":"Almeida JS, Carri\u00e7o JA, Maretzek A, Noble PA, Fletcher M. Analysis of genomic sequences by chaos game representation. Bioinformatics. 2001;17(5):429\u201337.","journal-title":"Bioinformatics"},{"key":"6136_CR43","doi-asserted-by":"publisher","first-page":"6263","DOI":"10.1016\/j.csbj.2021.11.008","volume":"19","author":"HF L\u00f6chel","year":"2021","unstructured":"L\u00f6chel HF, Heider D. Chaos game representation and its applications in bioinformatics. Comput Struct Biotechnol J. 2021;19:6263\u201371.","journal-title":"Comput Struct Biotechnol J"},{"key":"6136_CR44","doi-asserted-by":"crossref","unstructured":"Adetiba E, Badejo J A, Thakur S, Matthews VO, Adebiyi MO, Adebiyi EF. Experimental investigation of frequency chaos game representation for in silico and accurate classification of viral pathogens from genomic sequences. In: Proceedings of the International Work-Conference on Bioinformatics and Biomedical Engineering, 2017;pp. 155\u2013164","DOI":"10.1007\/978-3-319-56148-6_13"},{"issue":"5","key":"6136_CR45","doi-asserted-by":"publisher","first-page":"429","DOI":"10.1093\/bioinformatics\/17.5.429","volume":"17","author":"JS Almeida","year":"2001","unstructured":"Almeida JS, Carri\u00e7o JA, Maretzek A, Noble PA, Fletcher M. Analysis of genomic sequences by chaos game representation. Bioinformatics. 2001;17(5):429\u201337.","journal-title":"Bioinformatics"},{"key":"6136_CR46","unstructured":"Paszke A, Gross S, Massa F, Lerer A, Bradbury J, Chanan G, Killeen T, Lin Z, et al. Pytorch: An imperative style, high-performance deep learning library. In: Advances in Neural Information Processing Systems, vol. 32, 2019;pp. 8024\u20138035"},{"key":"6136_CR47","unstructured":"Loshchilov I, Hutter F. Decoupled weight decay regularization. In: Proceedings of the International Conference on Learning Representations. 2017;pp. 1\u201319"},{"issue":"11","key":"6136_CR48","first-page":"2579","volume":"9","author":"L Maaten","year":"2008","unstructured":"Maaten L, Hinton G. Visualizing data using t-SNE. J Mach Learn Res. 2008;9(11):2579\u2013605.","journal-title":"J Mach Learn Res"}],"container-title":["BMC Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s12859-025-06136-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1186\/s12859-025-06136-x\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s12859-025-06136-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,9]],"date-time":"2025-05-09T17:10:50Z","timestamp":1746810650000},"score":1,"resource":{"primary":{"URL":"https:\/\/bmcbioinformatics.biomedcentral.com\/articles\/10.1186\/s12859-025-06136-x"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,5,9]]},"references-count":48,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2025,12]]}},"alternative-id":["6136"],"URL":"https:\/\/doi.org\/10.1186\/s12859-025-06136-x","relation":{},"ISSN":["1471-2105"],"issn-type":[{"value":"1471-2105","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,5,9]]},"assertion":[{"value":"13 September 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"7 April 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"9 May 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"Not applicable.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval and consent to participate"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}},{"value":"The authors declare no Conflict of interest.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"125"}}