{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,4]],"date-time":"2026-04-04T18:06:34Z","timestamp":1775325994926,"version":"3.50.1"},"reference-count":45,"publisher":"Springer Science and Business Media LLC","issue":"14","license":[{"start":{"date-parts":[[2023,1,16]],"date-time":"2023-01-16T00:00:00Z","timestamp":1673827200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,1,16]],"date-time":"2023-01-16T00:00:00Z","timestamp":1673827200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Appl Intell"],"published-print":{"date-parts":[[2023,7]]},"DOI":"10.1007\/s10489-022-04387-2","type":"journal-article","created":{"date-parts":[[2023,1,16]],"date-time":"2023-01-16T08:02:58Z","timestamp":1673856178000},"page":"17887-17902","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":17,"title":["DeepCF-PPI: improved prediction of protein-protein interactions by combining learned and handcrafted features based on attention mechanisms"],"prefix":"10.1007","volume":"53","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-7976-4729","authenticated-orcid":false,"given":"Hoai-Nhan","family":"Tran","sequence":"first","affiliation":[]},{"given":"Quynh Nguyen Phuc","family":"Xuan","sequence":"additional","affiliation":[]},{"given":"Tuong-Tri","family":"Nguyen","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,1,16]]},"reference":[{"key":"4387_CR1","doi-asserted-by":"publisher","first-page":"4","DOI":"10.1007\/s12038-019-9909-z","volume":"44","author":"D Sarkar","year":"2019","unstructured":"Sarkar D, Saha S (2019) Machine-learning 
techniques for the prediction of protein\u2013protein interactions. J Biosci 44:4. https:\/\/doi.org\/10.1007\/s12038-019-9909-z","journal-title":"J Biosci"},{"issue":"1","key":"4387_CR2","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s12859-017-1700-2","volume":"18","author":"T Sun","year":"2017","unstructured":"Sun T, Zhou B, Lai L, Pei J (2017) Sequence-based prediction of protein protein interaction using a deep-learning algorithm. BMC Bioinforma 18(1):1\u20138. https:\/\/doi.org\/10.1186\/s12859-017-1700-2","journal-title":"BMC Bioinforma"},{"issue":"6","key":"4387_CR3","doi-asserted-by":"publisher","first-page":"1499","DOI":"10.1021\/acs.jcim.7b00028","volume":"57","author":"X Du","year":"2017","unstructured":"Du X, Sun S, Hu C, Yao Y, Yan Y, Zhang Y (2017) DeepPPI: boosting prediction of protein-protein interactions with deep neural networks. J Chem Inf Model 57(6):1499\u20131510. https:\/\/doi.org\/10.1021\/acs.jcim.7b00028","journal-title":"J Chem Inf Model"},{"issue":"9","key":"4387_CR4","doi-asserted-by":"publisher","first-page":"3025","DOI":"10.1093\/nar\/gkn159","volume":"36","author":"Y Guo","year":"2008","unstructured":"Guo Y, Yu L, Wen Z, Li M (2008) Using support vector machine combined with auto covariance to predict protein\u2013protein interactions from protein sequences. Nucleic Acids Res 36(9):3025\u20133030. https:\/\/doi.org\/10.1093\/nar\/gkn159","journal-title":"Nucleic Acids Res"},{"issue":"1","key":"4387_CR5","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s12859-019-2907-1","volume":"20","author":"KH Chen","year":"2019","unstructured":"Chen KH, Wang TF, Hu YJ (2019) Protein-protein interaction prediction using a hybrid feature representation and a stacked generalization scheme. BMC Bioinforma 20(1):1\u201317. 
https:\/\/doi.org\/10.1186\/s12859-019-2907-1","journal-title":"BMC Bioinforma"},{"issue":"5","key":"4387_CR6","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1371\/journal.pone.0125811","volume":"10","author":"ZH You","year":"2015","unstructured":"You ZH, Chan KCC, Hu P (2015) Predicting protein-protein interactions from primary protein sequences using a novel multi-scale local feature representation scheme and the random forest. PLoS ONE 10 (5):1\u201319. https:\/\/doi.org\/10.1371\/journal.pone.0125811","journal-title":"PLoS ONE"},{"key":"4387_CR7","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/1471-2105-15-S15-S9","volume":"15","author":"ZH You","year":"2014","unstructured":"You ZH, Zhu L, Zheng CH, Yu HJ, Deng SP, Ji Z (2014) Prediction of protein-protein interactions from amino acid sequences using a novel multi-scale continuous and discontinuous feature set. BMC Bioinformatics, vol.15, Suppl 15:1\u20139. https:\/\/doi.org\/10.1186\/1471-2105-15-S15-S9","journal-title":"BMC Bioinformatics, vol.15, Suppl"},{"key":"4387_CR8","doi-asserted-by":"publisher","first-page":"6","DOI":"10.7717\/peerj.7126","volume":"2019","author":"Y Yao","year":"2019","unstructured":"Yao Y, Du X, Diao Y, Zhu H (2019) An integration of deep learning with feature embedding for protein\u2013protein interaction prediction. PeerJ 2019:6. https:\/\/doi.org\/10.7717\/peerj.7126","journal-title":"PeerJ"},{"key":"4387_CR9","doi-asserted-by":"publisher","unstructured":"Zhou S, Wang S, Wu Q, Azim R, Li W (2020) Predicting potential miRNA-disease associations by combining gradient boosting decision tree with logistic regression. Comput Biol Chem, vol 85. 
https:\/\/doi.org\/10.1016\/j.compbiolchem.2020.107200","DOI":"10.1016\/j.compbiolchem.2020.107200"},{"key":"4387_CR10","doi-asserted-by":"publisher","first-page":"54","DOI":"10.1016\/j.chemolab.2019.06.003","volume":"191","author":"C Chen","year":"2019","unstructured":"Chen C, Zhang Q, Ma Q, Yu B (2019) LightGBM-PPI: predicting protein-protein interactions through lightGBM with multi-information fusion. Chemometr Intell Lab Syst 191:54\u201364. https:\/\/doi.org\/10.1016\/j.chemolab.2019.06.003","journal-title":"Chemometr Intell Lab Syst"},{"issue":"5","key":"4387_CR11","doi-asserted-by":"publisher","first-page":"582","DOI":"10.1016\/j.gpb.2021.01.001","volume":"18","author":"B Yu","year":"2020","unstructured":"Yu B, Chen C, Zhou H, Liu B, Ma Q (2020) GTB-PPI: predict protein\u2013protein interactions based on l1-regularized logistic regression and gradient tree boosting. Genomics, Proteomics and Bioinformatics 18(5):582\u2013592. https:\/\/doi.org\/10.1016\/j.gpb.2021.01.001","journal-title":"Genomics, Proteomics and Bioinformatics"},{"key":"4387_CR12","doi-asserted-by":"publisher","first-page":"114876","DOI":"10.1016\/j.eswa.2021.114876","volume":"176","author":"B Yu","year":"2021","unstructured":"Yu B, Chen C, Wang X, Yu Z, Ma A, Liu B (2021) Prediction of protein\u2013protein interactions based on elastic net and deep forest. Expert Syst Appl 176:114876. https:\/\/doi.org\/10.1016\/J.ESWA.2021.114876","journal-title":"Expert Syst Appl"},{"issue":"11","key":"4387_CR13","doi-asserted-by":"publisher","first-page":"4337","DOI":"10.1073\/pnas.0607879104","volume":"104","author":"J Shen","year":"2007","unstructured":"Shen J, et al. (2007) Predicting protein-protein interactions based only on sequences information. Proc Natl Acad Sci USA 104(11):4337\u20134341. 
https:\/\/doi.org\/10.1073\/pnas.0607879104","journal-title":"Proc Natl Acad Sci USA"},{"issue":"9","key":"4387_CR14","doi-asserted-by":"publisher","first-page":"1085","DOI":"10.2174\/092986610791760306","volume":"17","author":"L Yang","year":"2010","unstructured":"Yang L, Xia J -F, Gui J (2010) Prediction of protein-protein interactions from protein sequence using local descriptors. Protein & Peptide Letters 17(9):1085\u20131090. https:\/\/doi.org\/10.2174\/092986610791760306","journal-title":"Protein & Peptide Letters"},{"key":"4387_CR15","doi-asserted-by":"publisher","unstructured":"Zhou YZ, Gao Y, Zheng YY (2011) Prediction of protein-protein interactions using local description of amino acid sequence. In: Communications in Computer and Information Science, vol 202 CCIS, no. PART 2, pp 254\u2013262. https:\/\/doi.org\/10.1007\/978-3-642-22456-0_37","DOI":"10.1007\/978-3-642-22456-0_37"},{"issue":"10","key":"4387_CR16","doi-asserted-by":"publisher","first-page":"4992","DOI":"10.1021\/pr100618t","volume":"9","author":"XY Pan","year":"2010","unstructured":"Pan XY, Zhang YN, bin Shen H (2010) Large-scale prediction of human protein-protein interactions from amino acid sequence based on latent topic features. J Proteome Res 9(10):4992\u20135001. https:\/\/doi.org\/10.1021\/pr100618t","journal-title":"J Proteome Res"},{"key":"4387_CR17","doi-asserted-by":"publisher","first-page":"8","DOI":"10.1371\/journal.pone.0181426","volume":"12","author":"C Zhou","year":"2017","unstructured":"Zhou C, Yu H, Ding Y, Guo F, Gong XJ (2017) Multi-scale encoding of amino acid sequences for predicting protein interactions using gradient boosting decision tree. PLoS ONE 12:8. https:\/\/doi.org\/10.1371\/journal.pone.0181426","journal-title":"PLoS ONE"},{"key":"4387_CR18","doi-asserted-by":"publisher","unstructured":"Xuan P, Sun C, Zhang T, Ye Y, Shen T, Dong Y (2019) Gradient boosting decision tree-based method for predicting interactions between target genes and drugs. 
Front Genet, vol 10, no. MAY. https:\/\/doi.org\/10.3389\/fgene.2019.00459","DOI":"10.3389\/fgene.2019.00459"},{"issue":"17","key":"4387_CR19","doi-asserted-by":"publisher","first-page":"i802","DOI":"10.1093\/bioinformatics\/bty573","volume":"34","author":"S Hashemifar","year":"2018","unstructured":"Hashemifar S, Neyshabur B, Khan AA, Xu J (2018) Predicting protein-protein interactions through sequence-based deep learning. Bioinformatics 34(17):i802\u2013i810. https:\/\/doi.org\/10.1093\/bioinformatics\/bty573","journal-title":"Bioinformatics"},{"key":"4387_CR20","doi-asserted-by":"publisher","unstructured":"Gonzalez-Lopez F, Morales-Cordovilla JA, Villegas-Morcillo A, Gomez AM, Sanchez V (2019) End-to-end prediction of protein-protein interaction based on embedding and recurrent neural networks. https:\/\/doi.org\/10.1109\/BIBM.2018.8621328","DOI":"10.1109\/BIBM.2018.8621328"},{"key":"4387_CR21","unstructured":"Mikolov T, Chen K, Corrado G, Dean J (2013) Efficient estimation of word representations in vector space"},{"issue":"1","key":"4387_CR22","doi-asserted-by":"publisher","first-page":"74","DOI":"10.1093\/nsr\/nwy108","volume":"6","author":"ZH Zhou","year":"2019","unstructured":"Zhou ZH, Feng J (2019) Deep forest. Natl Sci Rev 6(1):74\u201386. https:\/\/doi.org\/10.1093\/nsr\/nwy108","journal-title":"Natl Sci Rev"},{"issue":"4","key":"4387_CR23","doi-asserted-by":"publisher","first-page":"271","DOI":"10.2174\/1570164616666190306152318","volume":"17","author":"C Xu","year":"2020","unstructured":"Xu C, Jiang L, Zhang Z, Yu X, Chen R, Xu J (Jun. 2020) An integrated prediction method for identifying protein-protein interactions. Curr Proteomics 17 (4):271\u2013286. 
https:\/\/doi.org\/10.2174\/1570164616666190306152318","journal-title":"Curr Proteomics"},{"issue":"8","key":"4387_CR24","doi-asserted-by":"publisher","first-page":"1","DOI":"10.3390\/molecules23081923","volume":"23","author":"H Li","year":"2018","unstructured":"Li H, Gong XJ, Yu H, Zhou C (2018) Deep neural network based predictions of protein interactions using primary sequences. Molecules 23(8):1\u201316. https:\/\/doi.org\/10.3390\/molecules23081923","journal-title":"Molecules"},{"key":"4387_CR25","doi-asserted-by":"publisher","first-page":"1","DOI":"10.3390\/app8010089","volume":"8","author":"XY Song","year":"2018","unstructured":"Song XY, Chen ZH, Sun XY, You ZH, Li LP, Zhao Y (Jan. 2018) An ensemble classifier with random projection for predicting protein-protein interactions using sequence and evolutionary information. Applied Sciences (Switzerland) 8:1. https:\/\/doi.org\/10.3390\/app8010089","journal-title":"Applied Sciences (Switzerland)"},{"issue":"1","key":"4387_CR26","doi-asserted-by":"publisher","first-page":"398","DOI":"10.1186\/s12859-016-1253-9","volume":"17","author":"Y Ding","year":"2016","unstructured":"Ding Y, Tang J, Guo F (2016) Predicting protein-protein interactions via multivariate mutual information of protein sequences. BMC Bioinforma 17(1):398. https:\/\/doi.org\/10.1186\/s12859-016-1253-9","journal-title":"BMC Bioinforma"},{"issue":"3","key":"4387_CR27","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1609\/aimag.v18i3.1303","volume":"18","author":"TM Mitchell","year":"1997","unstructured":"Mitchell TM (1997) Does machine learning really work?. AI Mag 18(3):11\u201320. 
https:\/\/doi.org\/10.1609\/aimag.v18i3.1303","journal-title":"AI Mag"},{"issue":"1","key":"4387_CR28","doi-asserted-by":"publisher","first-page":"303","DOI":"10.1093\/nar\/30.1.303","volume":"30","author":"I Xenarios","year":"2002","unstructured":"Xenarios I (2002) DIP, the database of interacting proteins: a research tool for studying cellular networks of protein interactions. Nucleic Acids Res 30(1):303\u2013305. https:\/\/doi.org\/10.1093\/nar\/30.1.303","journal-title":"Nucleic Acids Res"},{"issue":"13","key":"4387_CR29","doi-asserted-by":"publisher","first-page":"1658","DOI":"10.1093\/bioinformatics\/btl158","volume":"22","author":"W Li","year":"2006","unstructured":"Li W, Godzik A (2006) Cd-hit: a fast program for clustering and comparing large sets of protein or nucleotide sequences. Bioinformatics 22(13):1658\u20131659. https:\/\/doi.org\/10.1093\/bioinformatics\/btl158","journal-title":"Bioinformatics"},{"key":"4387_CR30","doi-asserted-by":"publisher","unstructured":"Huang YA, You ZH, Gao X, Wong L, Wang L (2015) Using weighted sparse representation model combined with discrete cosine transformation to predict protein-protein interactions from protein sequence, BioMed Research International, vol 2015. https:\/\/doi.org\/10.1155\/2015\/902198","DOI":"10.1155\/2015\/902198"},{"issue":"22","key":"4387_CR31","doi-asserted-by":"publisher","first-page":"23262","DOI":"10.1074\/jbc.M401932200","volume":"279","author":"M Bhasin","year":"2004","unstructured":"Bhasin M, Raghava GPS (2004) Classification of nuclear receptors based on amino acid composition and dipeptide composition. J Biol Chem 279(22):23262\u201323266. 
https:\/\/doi.org\/10.1074\/jbc.M401932200","journal-title":"J Biol Chem"},{"issue":"4","key":"4387_CR32","doi-asserted-by":"publisher","first-page":"262","DOI":"10.2174\/157016409789973707","volume":"6","author":"K-C Chou","year":"2009","unstructured":"Chou K-C (2009) Pseudo amino acid composition and its applications in bioinformatics, proteomics and system biology. Curr Proteomics 6(4):262\u2013274. https:\/\/doi.org\/10.2174\/157016409789973707","journal-title":"Curr Proteomics"},{"issue":"1","key":"4387_CR33","doi-asserted-by":"publisher","first-page":"10","DOI":"10.1093\/bioinformatics\/bth466","volume":"21","author":"K-C Chou","year":"2005","unstructured":"Chou K-C (2005) Using amphiphilic pseudo amino acid composition to predict enzyme subfamily classes. Bioinformatics 21(1):10\u201319. https:\/\/doi.org\/10.1093\/bioinformatics\/bth466","journal-title":"Bioinformatics"},{"issue":"2","key":"4387_CR34","doi-asserted-by":"publisher","first-page":"477","DOI":"10.1006\/bbrc.2000.3815","volume":"278","author":"KC Chou","year":"2000","unstructured":"Chou KC (2000) Prediction of protein subcellular locations by incorporating quasi-sequence-order effect. Biochem Biophys Res Commun 278(2):477\u2013483. https:\/\/doi.org\/10.1006\/bbrc.2000.3815","journal-title":"Biochem Biophys Res Commun"},{"issue":"10","key":"4387_CR35","doi-asserted-by":"publisher","first-page":"648","DOI":"10.1089\/omi.2015.0095","volume":"19","author":"V Saravanan","year":"2015","unstructured":"Saravanan V, Gautham N (2015) Harnessing computational biology for exact linear B-cell epitope prediction: a novel amino acid composition-based feature descriptor. OMICS A Journal of Integrative Biology 19 (10):648\u2013658. 
https:\/\/doi.org\/10.1089\/omi.2015.0095","journal-title":"OMICS A Journal of Integrative Biology"},{"key":"4387_CR36","doi-asserted-by":"publisher","first-page":"4","DOI":"10.1016\/j.ymeth.2019.04.008","volume":"166","author":"Y Li","year":"2019","unstructured":"Li Y, Huang C, Ding L, Li Z, Pan Y, Gao X (Aug. 2019) Deep learning in bioinformatics: introduction, application, and perspective in the big data era. Methods 166:4\u201321. https:\/\/doi.org\/10.1016\/j.ymeth.2019.04.008","journal-title":"Methods"},{"key":"4387_CR37","doi-asserted-by":"publisher","unstructured":"Skansi S (2018) Introduction To deep learning. Cham: springer international publishing. https:\/\/doi.org\/10.1007\/978-3-319-73004-2","DOI":"10.1007\/978-3-319-73004-2"},{"key":"4387_CR38","doi-asserted-by":"publisher","first-page":"19","DOI":"10.1007\/s11042-019-08453-9","volume":"79","author":"C Garbin","year":"2020","unstructured":"Garbin C, Zhu X, Marques O (2020) Dropout vs. batch normalization: an empirical study of their impact to deep learning. Multimed Tools Appl 79:19\u201320. https:\/\/doi.org\/10.1007\/s11042-019-08453-9","journal-title":"Multimed Tools Appl"},{"key":"4387_CR39","unstructured":"Rehurek R, Sojka P (2011) Gensim-python framework for vector space modelling. NLP Centre, Faculty of Informatics, Masaryk University, Brno, Czech Republic, vol 3, 2"},{"key":"4387_CR40","unstructured":"Abadi M, et al. (2016) TensorFlow: a system for large-scale machine learning. In: Proceedings of the 12th USENIX Symposium on Operating Systems Design and Implementation OSDI"},{"key":"4387_CR41","first-page":"2825","volume":"12","author":"F Pedregosa","year":"2011","unstructured":"Pedregosa F, et al. (2011) Scikit-learn: machine learning in python. 
J Mach Learn Res 12:2825\u20132830","journal-title":"J Mach Learn Res"},{"issue":"October","key":"4387_CR42","doi-asserted-by":"publisher","first-page":"277","DOI":"10.1016\/j.neucom.2016.10.042","volume":"228","author":"ZH You","year":"2017","unstructured":"You ZH, Li X, Chan KC (2017) An improved sequence-based prediction protocol for protein-protein interactions using amino acids substitution matrix and rotation forest ensemble classifiers. Neurocomputing 228(October):277\u2013282. https:\/\/doi.org\/10.1016\/j.neucom.2016.10.042","journal-title":"Neurocomputing"},{"issue":"1","key":"4387_CR43","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1038\/s41598-021-96265-z","volume":"11","author":"Y Li","year":"2021","unstructured":"Li Y, et al. (2021) Robust and accurate prediction of protein\u2013protein interactions by exploiting evolutionary information. Sci Rep 11(1):1\u201312. https:\/\/doi.org\/10.1038\/s41598-021-96265-z","journal-title":"Sci Rep"},{"key":"4387_CR44","doi-asserted-by":"publisher","unstructured":"Shrestha A, Mahmood A (2019) Review of deep learning algorithms and architectures. vol 7. https:\/\/doi.org\/10.1109\/ACCESS.2019.2912200","DOI":"10.1109\/ACCESS.2019.2912200"},{"key":"4387_CR45","doi-asserted-by":"publisher","unstructured":"Jurtz VI, et al. (2017) An introduction to deep learning on biological sequence data: examples and solutions. Bioinformatics, vol 33, 22. 
https:\/\/doi.org\/10.1093\/bioinformatics\/btx531","DOI":"10.1093\/bioinformatics\/btx531"}],"container-title":["Applied Intelligence"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10489-022-04387-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10489-022-04387-2\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10489-022-04387-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,7,4]],"date-time":"2023-07-04T12:17:43Z","timestamp":1688473063000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10489-022-04387-2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,1,16]]},"references-count":45,"journal-issue":{"issue":"14","published-print":{"date-parts":[[2023,7]]}},"alternative-id":["4387"],"URL":"https:\/\/doi.org\/10.1007\/s10489-022-04387-2","relation":{},"ISSN":["0924-669X","1573-7497"],"issn-type":[{"value":"0924-669X","type":"print"},{"value":"1573-7497","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,1,16]]},"assertion":[{"value":"5 December 2022","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"16 January 2023","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"Not applicable.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval"}},{"value":"The authors declare that they have no competing 
interests.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}]}}