{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,8]],"date-time":"2026-03-08T23:45:21Z","timestamp":1773013521053,"version":"3.50.1"},"reference-count":47,"publisher":"Tech Science Press","issue":"2","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["CMC"],"published-print":{"date-parts":[[2025]]},"DOI":"10.32604\/cmc.2025.067390","type":"journal-article","created":{"date-parts":[[2025,7,28]],"date-time":"2025-07-28T09:10:48Z","timestamp":1753693848000},"page":"3095-3128","source":"Crossref","is-referenced-by-count":2,"title":["A Comparative Study of Data Representation Techniques for Deep Learning-Based Classification of Promoter and Histone-Associated DNA Regions"],"prefix":"10.32604","volume":"85","author":[{"given":"Sarab","family":"Almuhaideb","sequence":"first","affiliation":[]},{"given":"Najwa","family":"Altwaijry","sequence":"additional","affiliation":[]},{"given":"Isra","family":"Al-Turaiki","sequence":"additional","affiliation":[]},{"given":"Ahmad Raza","family":"Khan","sequence":"additional","affiliation":[]},{"given":"Hamza Ali","family":"Rizvi","sequence":"additional","affiliation":[]}],"member":"17807","published-online":{"date-parts":[[2025]]},"reference":[{"key":"ref1","doi-asserted-by":"crossref","first-page":"D56","DOI":"10.1093\/nar\/gkae1114","article-title":"GenBank 2025 update","volume":"53","author":"Sayers","year":"2025","journal-title":"Nucleic Acids Res"},{"key":"ref2","unstructured":"Ghosh P, Fagnan K, Connor R, Pannu R, Wheeler TJ, Pop M, et al. Contributions of the Petabyte Scale Sequence Search Codeathon toward efforts to scale sequence-based searches on SRA. arXiv:2505.06395. 2025."},{"key":"ref3","doi-asserted-by":"crossref","first-page":"40","DOI":"10.1145\/1882471.1882478","article-title":"A brief survey on sequence classification","volume":"12","author":"Xing","year":"2010","journal-title":"ACM SIGKDD Explor Newsl"},{"key":"ref4","doi-asserted-by":"crossref","first-page":"209","DOI":"10.1089\/cmb.1999.6.209","article-title":"New techniques for DNA sequence classification","volume":"6","author":"Wang","year":"1999","journal-title":"J Comput Biol J Comput Mol Cell Biol"},{"key":"ref5","doi-asserted-by":"crossref","first-page":"1032","DOI":"10.3389\/fbioe.2020.01032","article-title":"Review on the application of machine learning algorithms in the sequence data mining of DNA","volume":"8","author":"Yang","year":"2020","journal-title":"Front Bioeng Biotechnol"},{"key":"ref6","doi-asserted-by":"crossref","first-page":"e1835056","DOI":"10.1155\/2021\/1835056","article-title":"Analysis of DNA sequence classification using CNN and hybrid models","volume":"2021","author":"Gunasekaran","year":"2021","journal-title":"Comput Math Methods Med"},{"key":"ref7","doi-asserted-by":"crossref","first-page":"280","DOI":"10.4236\/jbise.2016.95021","article-title":"DNA sequence classification by convolutional neural network","volume":"9","author":"Nguyen","year":"2016","journal-title":"J Biomed Sci Eng"},{"key":"ref8","series-title":"Proceedings of the 17th International Conference on Computer Systems and Technologies 2016, CompSysTech \u201916; 2016 Jun 23\u201324","first-page":"222","article-title":"Classification experiments of DNA sequences by using a deep neural network and chaos game representation","author":"Rizzo"},{"key":"ref9","series-title":"Proceedings of the 2017 International Conference on Computer and Drone Applications (IConDA); 2017 Nov 9\u201311","first-page":"60","article-title":"Evaluation of convolutionary neural networks modeling of DNA sequences using ordinal versus one-hot encoding method","author":"Choong"},{"key":"ref10","doi-asserted-by":"crossref","first-page":"100","DOI":"10.56427\/jcbd.v4i2.762","article-title":"DNA sequence classification using machine learning models based on k-mer features","volume":"4","author":"Kautsar","year":"2025","journal-title":"J Comput Digital Busin"},{"key":"ref11","first-page":"c66","article-title":"Classification of DNA using machine learning","volume":"9","author":"Vishal","year":"2024 Apr","journal-title":"Int J Novel Res Develop (IJNRD)"},{"key":"ref12","series-title":"Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition; 2016 Jun 27\u201330","first-page":"770","article-title":"Deep residual learning for image recognition","author":"He"},{"key":"ref13","series-title":"Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition; 2016 Jun 27\u201330","first-page":"2818","article-title":"Rethinking the inception architecture for computer vision","author":"Szegedy"},{"key":"ref14","doi-asserted-by":"crossref","first-page":"517","DOI":"10.1016\/j.cell.2005.06.026","article-title":"Genome-wide map of nucleosome acetylation and methylation in yeast","volume":"122","author":"Pokholok","year":"2005","journal-title":"Cell"},{"key":"ref15","doi-asserted-by":"crossref","first-page":"1503229","DOI":"10.3389\/fmed.2025.1503229","article-title":"DNA sequence analysis landscape: a comprehensive review of DNA sequence analysis task types, databases, datasets, word embedding methods, and language models","volume":"12","author":"Asim","year":"2025","journal-title":"Front Med"},{"key":"ref16","first-page":"61","author":"Sastri","year":"2025","journal-title":"Computational techniques for biological sequence analysis"},{"key":"ref17","series-title":"Proceedings of the Advances in Knowledge Discovery and Data Mining, 17th Pacific-Asia Conference, PAKDD 2013; 2013 Apr 14\u201317","article-title":"Evaluation of techniques for classifying biological sequences","author":"Deshpande"},{"key":"ref18","series-title":"Proceedings of the Ninth ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, KDD \u201903; 2023 Aug 24\u201327","first-page":"436","article-title":"Frequent-subsequence-based prediction of outer membrane proteins","author":"She"},{"key":"ref19","unstructured":"RuleQuest-Research. Data Mining Tools See5 and C5.0. [cited 2022 Dec 2]. Available from: https:\/\/www.rulequest.com\/see5-info.html."},{"key":"ref20","doi-asserted-by":"crossref","first-page":"104650","DOI":"10.1016\/j.compbiomed.2021.104650","article-title":"Classification of SARS-CoV-2 and non-SARS-CoV-2 using machine learning algorithms","volume":"136","author":"Singh","year":"2021","journal-title":"Comput Biol Med"},{"key":"ref21","doi-asserted-by":"crossref","first-page":"0011","DOI":"10.34133\/research.0011","article-title":"Biological sequence classification: a review on data and general methods","volume":"2022","author":"Ao","year":"2022","journal-title":"Research"},{"key":"ref22","doi-asserted-by":"crossref","first-page":"107221","DOI":"10.1016\/j.compbiomed.2023.107221","article-title":"Cancer-inspired genomics mapper model for the generation of synthetic DNA sequences with desired genomics signatures","volume":"164","author":"Lazebnik","year":"2023","journal-title":"Comput Biol Med"},{"key":"ref23","doi-asserted-by":"crossref","first-page":"5757","DOI":"10.1007\/s00521-023-09366-3","article-title":"The deep learning applications in IoT-based bio-and medical informatics: a systematic literature review","volume":"36","author":"Amiri","year":"2024","journal-title":"Neural Comput Applicat"},{"key":"ref24","doi-asserted-by":"crossref","first-page":"2365","DOI":"10.1007\/s11030-023-10718-3","article-title":"Review and perspective on bioinformatics tools using machine learning and deep learning for predicting antiviral peptides","volume":"28","author":"Lefin","year":"2024","journal-title":"Molec Diver"},{"key":"ref25","doi-asserted-by":"crossref","first-page":"bbae0424","DOI":"10.1093\/bib\/bbae042","article-title":"Deep learning in structural bioinformatics: current applications and future perspectives","volume":"25","author":"Kumar","year":"2024","journal-title":"Brief Bioinform"},{"key":"ref26","doi-asserted-by":"crossref","first-page":"i269","DOI":"10.1093\/bioinformatics\/btz339","article-title":"Comprehensive evaluation of deep learning architectures for prediction of DNA\/RNA sequence binding specificities","volume":"35","author":"Trabelsi","year":"2019","journal-title":"Bioinformatics"},{"key":"ref27","doi-asserted-by":"crossref","first-page":"6009","DOI":"10.1016\/j.csbj.2021.10.034","article-title":"DCNN-4mC: densely connected neural network based N4-methylcytosine site prediction in multiple species","volume":"19","author":"Rehman","year":"2021","journal-title":"Computat Struct Biotechnol J"},{"key":"ref28","doi-asserted-by":"crossref","first-page":"100147","DOI":"10.1016\/j.slast.2024.100147","article-title":"Assessment and classification of COVID-19 DNA sequence using pairwise features concatenation from multi-transformer and deep features with machine learning models","volume":"29","author":"Qayyum","year":"2024","journal-title":"SLAS Technol"},{"key":"ref29","doi-asserted-by":"crossref","first-page":"e365","DOI":"10.7717\/peerj-cs.365","article-title":"Comparison of machine learning and deep learning techniques in promoter prediction across diverse species","volume":"7","author":"Bhandari","year":"2021","journal-title":"PeerJ Comput Sci"},{"key":"ref30","doi-asserted-by":"crossref","first-page":"107040","DOI":"10.1016\/j.neunet.2024.107040","article-title":"A sparse and wide neural network model for DNA sequences","volume":"184","author":"Yu","year":"2025","journal-title":"Neural Netw"},{"key":"ref31","doi-asserted-by":"crossref","first-page":"2397","DOI":"10.1109\/JBHI.2024.3355758","article-title":"TBCA: prediction of transcription factor binding sites using a deep neural network with lightweight attention mechanism","volume":"28","author":"Wang","year":"2024","journal-title":"IEEE J Biomed Health Inform"},{"key":"ref32","doi-asserted-by":"crossref","first-page":"5239","DOI":"10.1007\/s11760-024-03229-7","article-title":"DeepCTF: transcription factor binding specificity prediction using DNA sequence plus shape in an attention-based deep learning model","volume":"16","author":"Tariq","year":"2024","journal-title":"Signal Image Video Process"},{"key":"ref33","volume":"15276","author":"Amato","journal-title":"Computational intelligence methods for bioinformatics and biostatistics. CIBB 2024. Lecture notes in computer science"},{"key":"ref34","doi-asserted-by":"crossref","first-page":"e2122636119","DOI":"10.1073\/pnas.2122636119","article-title":"Taxonomic classification of DNA sequences beyond sequence similarity using deep neural networks","volume":"119","author":"Mock","year":"2022","journal-title":"Proc Natl Acad Sci U S A"},{"key":"ref35","doi-asserted-by":"crossref","first-page":"107035","DOI":"10.1016\/j.cmpb.2022.107035","article-title":"Predicting gene expression levels from DNA sequences and post-transcriptional information with transformers","volume":"225","author":"Pipoli","year":"2022","journal-title":"Comput Methods Programs Biomed"},{"key":"ref36","unstructured":"Mikolov T. Efficient estimation of word representations in vector space. arXiv:1301.3781. 2023."},{"key":"ref37","doi-asserted-by":"crossref","first-page":"bbab360","DOI":"10.1093\/bib\/bbab360","article-title":"DeepLncLoc: a deep learning framework for long non-coding RNA subcellular localization prediction based on subsequence embedding","volume":"23","author":"Zeng","year":"2022","journal-title":"Brief Bioinform"},{"key":"ref38","doi-asserted-by":"crossref","first-page":"1593","DOI":"10.3390\/genes15121593","article-title":"TExCNN: leveraging pre-trained models to predict gene expression from genomic sequences","volume":"15","author":"Dong","year":"2024","journal-title":"Genes"},{"key":"ref39","doi-asserted-by":"crossref","first-page":"2112","DOI":"10.1093\/bioinformatics\/btab083","article-title":"DNABERT: pre-trained bidirectional encoder representations from transformers model for DNA-language in genome","volume":"37","author":"Ji","year":"2021","journal-title":"Bioinformatics"},{"key":"ref40","unstructured":"Zhou Z, Ji Y, Li W, Dutta P, Davuluri R, Liu H. Dnabert-2: efficient foundation model and benchmark for multi-species genome. arXiv:2306.15006. 2023."},{"key":"ref41","doi-asserted-by":"crossref","first-page":"247","DOI":"10.1007\/978-3-030-95041-5_6","author":"Kim","year":"2022","journal-title":"Artificial intelligence for 6G"},{"key":"ref42","doi-asserted-by":"crossref","first-page":"1435","DOI":"10.1126\/science.2983426","article-title":"Rapid and sensitive protein similarity searches","volume":"227","author":"Lipman","year":"1985","journal-title":"Science"},{"key":"ref43","first-page":"621","article-title":"Colorsquare: a colorful square visualization of DNA sequences","volume":"68","author":"Zhang","year":"2012","journal-title":"Match-Commun Math Comput Chem"},{"key":"ref44","doi-asserted-by":"crossref","first-page":"429","DOI":"10.1093\/bioinformatics\/17.5.429","article-title":"Analysis of genomic sequences by Chaos Game Representation","volume":"17","author":"Almeida","year":"2001","journal-title":"Bioinformatics"},{"key":"ref45","doi-asserted-by":"crossref","first-page":"427","DOI":"10.1016\/j.ipm.2009.03.002","article-title":"A systematic analysis of performance measures for classification tasks","volume":"45","author":"Sokolova","year":"2009","journal-title":"Inform Process Manag"},{"key":"ref46","author":"Nemenyi","year":"1963","journal-title":"Distribution-free multiple comparisons"},{"key":"ref47","first-page":"5907","article-title":"An improved convolutional neural network model for DNA classification","volume":"70","author":"Soliman","year":"2022","journal-title":"Comput Mater Contin"}],"container-title":["Computers, Materials &amp; Continua"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/cdn.techscience.cn\/files\/cmc\/2025\/TSP_CMC-85-2\/TSP_CMC_67390\/TSP_CMC_67390.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,12,4]],"date-time":"2025-12-04T05:35:41Z","timestamp":1764826541000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.techscience.com\/cmc\/v85n2\/63823"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"references-count":47,"journal-issue":{"issue":"2","published-online":{"date-parts":[[2025]]},"published-print":{"date-parts":[[2025]]}},"URL":"https:\/\/doi.org\/10.32604\/cmc.2025.067390","relation":{},"ISSN":["1546-2226"],"issn-type":[{"value":"1546-2226","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025]]}}}