{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,5]],"date-time":"2025-11-05T00:01:32Z","timestamp":1762300892749,"version":"3.37.1"},"reference-count":43,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2025,2,15]],"date-time":"2025-02-15T00:00:00Z","timestamp":1739577600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,2,15]],"date-time":"2025-02-15T00:00:00Z","timestamp":1739577600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["SN COMPUT. SCI."],"DOI":"10.1007\/s42979-025-03709-8","type":"journal-article","created":{"date-parts":[[2025,2,15]],"date-time":"2025-02-15T09:12:36Z","timestamp":1739610756000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Class-Balanced Protein Interaction Site Prediction Using Global and Local Features with XGBoost and Deep Learning"],"prefix":"10.1007","volume":"6","author":[{"given":"Bharath C.","family":"Kulkarni","sequence":"first","affiliation":[]},{"given":"Bommineni Shiva","family":"Sai","sequence":"additional","affiliation":[]},{"given":"Varun","family":"Kolagad","sequence":"additional","affiliation":[]},{"given":"Nagamma","family":"Patil","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0009-0004-7508-965X","authenticated-orcid":false,"given":"Prajna","family":"Bhat","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,2,15]]},"reference":[{"issue":"7","key":"3709_CR1","doi-asserted-by":"publisher","first-page":"3932","DOI":"10.1021\/acs.chemrev.3c00550","volume":"124","author":"G Grassmann","year":"2024","unstructured":"Grassmann G, Miotto M, Desantis F, Rienzo LD, Tartaglia GG, Pastore A, Ruocco G, Monti M, Milanetti E. Computational approaches to predict protein-protein interactions in crowded cellular environments. Chem Rev. 2024;124(7):3932\u201377.","journal-title":"Chem Rev"},{"issue":"4","key":"3709_CR2","doi-asserted-by":"publisher","DOI":"10.1016\/j.jsb.2024.108118","volume":"216","author":"S Akbarzadeh","year":"2024","unstructured":"Akbarzadeh S, Co\u015fkun \u00d6, G\u00fcn\u00e7er B. Studying protein-protein interactions: latest and most popular approaches. J Struct Biol. 2024;216(4): 108118.","journal-title":"J Struct Biol"},{"issue":"1","key":"3709_CR3","doi-asserted-by":"publisher","first-page":"474","DOI":"10.1186\/s12864-022-08687-2","volume":"23","author":"X Li","year":"2022","unstructured":"Li X, Han P, Wang G, Chen W, Wang S, Song T. SDNN-PPI: self-attention with deep neural network effect on protein-protein interaction prediction. BMC Genom. 2022;23(1):474.","journal-title":"BMC Genom"},{"key":"3709_CR4","first-page":"2200292","volume":"23","author":"N Kewalramani","year":"2023","unstructured":"Kewalramani N, Emili A, Crovella M. State-of-the-art computational methods to predict protein-protein interactions with high accuracy and coverage. Proteom Syst Biol. 2023;23:2200292.","journal-title":"Proteom Syst Biol"},{"key":"3709_CR5","doi-asserted-by":"publisher","first-page":"1761","DOI":"10.1038\/s41598-020-80900-2","volume":"11","author":"S Das","year":"2021","unstructured":"Das S, Chakrabarti S. Classification and prediction of protein-protein interaction interface using machine learning algorithm. Sci Rep. 2021;11:1761.","journal-title":"Sci Rep"},{"issue":"6","key":"3709_CR6","doi-asserted-by":"publisher","first-page":"3646","DOI":"10.1109\/TCBB.2021.3123269","volume":"19","author":"M Li","year":"2022","unstructured":"Li M, Wu Z, Wang W, Lu K, Zhang J, Zhou Y, Chen Z, Li D, Zheng S, Chen P, Wang B. Protein-protein interaction sites prediction based on an under-sampling strategy and random forest algorithm. IEEE\/ACM Trans Comput Biol Bioinf. 2022;19(6):3646\u201354.","journal-title":"IEEE\/ACM Trans Comput Biol Bioinf"},{"issue":"2","key":"3709_CR7","doi-asserted-by":"publisher","first-page":"bbad076","DOI":"10.1093\/bib\/bbad076","volume":"24","author":"T Tang","year":"2023","unstructured":"Tang T, Zhang X, Liu Y, Peng H, Zheng B, Yin Y, Zeng X. Machine learning on protein-protein interaction prediction: models, challenges and trends. Brief Bioinform. 2023;24(2):bbad076.","journal-title":"Brief Bioinform"},{"key":"3709_CR8","doi-asserted-by":"publisher","first-page":"1512","DOI":"10.1016\/j.csbj.2021.03.005","volume":"19","author":"J Sun","year":"2021","unstructured":"Sun J, Frishman D. Improved sequence-based prediction of interaction sites in a-helical transmembrane proteins by deep learning. Comput Struct Biotechnol. 2021;19:1512\u201330.","journal-title":"Comput Struct Biotechnol"},{"issue":"3","key":"3709_CR9","doi-asserted-by":"publisher","first-page":"491","DOI":"10.1007\/s00249-021-01539-z","volume":"50","author":"RK Balogh","year":"2021","unstructured":"Balogh RK, Nemeth E, Jones NC, Hofmann SV, Jancso A, Gyurcsik B. A study on the secondary structure of the metalloregulatory protein CueR: effect of pH, metal ions and DNA. Eur Biophys J. 2021;50(3):491\u2013500.","journal-title":"Eur Biophys J"},{"issue":"9","key":"3709_CR10","doi-asserted-by":"publisher","first-page":"2452","DOI":"10.1093\/bioinformatics\/btac138","volume":"38","author":"T Zhou","year":"2022","unstructured":"Zhou T, Rong J, Liu Y, Gong W, Li C. An ensemble approach to predict binding hotspots in protein-RNA interactions based on SMOTE data balancing and Random Grouping feature selection strategies. Bioinformatics. 2022;38(9):2452\u20138.","journal-title":"Bioinformatics"},{"issue":"13","key":"3709_CR11","doi-asserted-by":"publisher","first-page":"2117","DOI":"10.3390\/cells11132117","volume":"11","author":"SH Khan","year":"2022","unstructured":"Khan SH, Tayara H, Chong KT. ProB-Site: protein binding site prediction using local features. Cells. 2022;11(13):2117.","journal-title":"Cells"},{"key":"3709_CR12","doi-asserted-by":"publisher","first-page":"4775","DOI":"10.1007\/s40747-024-01399-y","volume":"10","author":"Q Leng","year":"2024","unstructured":"Leng Q, Guo J, Meng JT, Wang C. OBMI: oversampling borderline minority instances by a two-stage Tomek link-finding procedure for class imbalance problem. Complex Intell Syst. 2024;10:4775\u201392.","journal-title":"Complex Intell Syst"},{"key":"3709_CR13","doi-asserted-by":"publisher","first-page":"15693","DOI":"10.1007\/s00521-021-06189-y","volume":"33","author":"EC Gok","year":"2021","unstructured":"Gok EC, Olgun MO. SMOTE-NC and gradient boosting imputation based random forest classifier for predicting severity level of covid-19 patients with blood samples. Neural Comput Appl. 2021;33:15693\u2013707.","journal-title":"Neural Comput Appl"},{"key":"3709_CR14","doi-asserted-by":"publisher","first-page":"90","DOI":"10.1186\/s12911-024-02487-2","volume":"24","author":"S Cusworth","year":"2024","unstructured":"Cusworth S, Gkoutos GV, Acharjee A. A novel generative adversarial networks modelling for the class imbalance problem in high dimensional omics data. BMC Med Inform Decis Mak. 2024;24:90.","journal-title":"BMC Med Inform Decis Mak"},{"issue":"1","key":"3709_CR15","doi-asserted-by":"publisher","first-page":"125","DOI":"10.1093\/bioinformatics\/btab643","volume":"38","author":"Q Yuan","year":"2021","unstructured":"Yuan Q, Chen J, Zhao H, Zhou Y, Yang Y. Structure-aware protein-protein interaction site prediction using deep graph convolutional network. Bioinformatics. 2021;38(1):125\u201332.","journal-title":"Bioinformatics"},{"issue":"5","key":"3709_CR16","doi-asserted-by":"publisher","first-page":"3314","DOI":"10.1109\/TCBB.2023.3265640","volume":"20","author":"Y Liu","year":"2023","unstructured":"Liu Y, Li P, Tu S, Xu L. RefinePocket: an attention-enhanced and mask-guided deep learning approach for protein binding site prediction. IEEE\/ACM Trans Comput Biol Bioinf. 2023;20(5):3314\u201321.","journal-title":"IEEE\/ACM Trans Comput Biol Bioinf"},{"issue":"7","key":"3709_CR17","doi-asserted-by":"publisher","first-page":"896","DOI":"10.1093\/bioinformatics\/btaa750","volume":"37","author":"Y Li","year":"2021","unstructured":"Li Y, Golding GB, Ilie L. DELPHI: accurate deep ensemble model for protein interaction sites prediction. Bioinformatics. 2021;37(7):896\u2013904.","journal-title":"Bioinformatics"},{"issue":"1","key":"3709_CR18","doi-asserted-by":"publisher","first-page":"16910","DOI":"10.1038\/s41598-021-96265-z","volume":"11","author":"Y Li","year":"2021","unstructured":"Li Y, Wang Z, Li LP, You ZH, Huang WZ, Zhan XK, Wang YB. Robust and accurate prediction of protein-protein interactions by exploiting evolutionary information. Sci Rep. 2021;11(1):16910.","journal-title":"Sci Rep"},{"issue":"1","key":"3709_CR19","doi-asserted-by":"publisher","DOI":"10.1016\/j.xcrp.2023.101758","volume":"5","author":"H Ozawa","year":"2024","unstructured":"Ozawa H, Unno I, Sekine R, Chisuga T, Ito S, Nakano S. Development of evolutionary algorithm-based protein redesign method. Cell Rep Phys Sci. 2024;5(1): 101758.","journal-title":"Cell Rep Phys Sci"},{"issue":"6","key":"3709_CR20","doi-asserted-by":"publisher","first-page":"3588","DOI":"10.1109\/TCBB.2023.3306948","volume":"20","author":"Y Gong","year":"2023","unstructured":"Gong Y, Li R, Fu B, Liu Y, Wang J, Li R, Chen DZ. A CNN-LSTM ensemble model for predicting protein-protein interaction binding sites. IEEE\/ACM Trans Comput Biol Bioinf. 2023;20(6):3588\u201399.","journal-title":"IEEE\/ACM Trans Comput Biol Bioinf"},{"issue":"4","key":"3709_CR21","doi-asserted-by":"publisher","first-page":"1114","DOI":"10.1093\/bioinformatics\/btz699","volume":"36","author":"M Zeng","year":"2020","unstructured":"Zeng M, Zhang F, Wu FX, Li Y, Wang J, Li M. Protein-protein interaction site prediction through combining local and global features with deep neural networks. Bioinformatics. 2020;36(4):1114\u201320.","journal-title":"Bioinformatics"},{"key":"3709_CR22","volume":"139","author":"MZ Alom","year":"2021","unstructured":"Alom MZ, Akter MM, Adnan MN, Taha TM. Deep learning-based protein-protein interaction site prediction: advancements and challenges. Comput Biol Med. 2021;139: 104992.","journal-title":"Comput Biol Med"},{"issue":"3","key":"3709_CR23","doi-asserted-by":"publisher","first-page":"2190","DOI":"10.1109\/TCBB.2023.3238001","volume":"20","author":"C Jiang","year":"2023","unstructured":"Jiang C, Lv W, Li J. Protein-protein interaction sites prediction using batch normalization based cnns and oversampling method borderline-SMOTE. IEEE\/ACM Trans Comput Biol Bioinf. 2023;20(3):2190\u20139.","journal-title":"IEEE\/ACM Trans Comput Biol Bioinf"},{"issue":"9","key":"3709_CR24","doi-asserted-by":"publisher","first-page":"3246","DOI":"10.3390\/s22093246","volume":"22","author":"EF Swana","year":"2022","unstructured":"Swana EF, Doorsamy W, Bokoro P. Tomek link and SMOTE approaches for machine fault classification with an imbalanced dataset. Sensors. 2022;22(9):3246.","journal-title":"Sensors."},{"key":"3709_CR25","doi-asserted-by":"crossref","unstructured":"Ashrafi N, Schmitt V, Spang RP, M\u00f6ller S, Antons JNV. Protect and extend-using GANs for synthetic data generation of time-series medical records. In: 2023 15th International Conference on Quality of Multimedia Experience (QoMEX), Ghent, Belgium. 2023; 171-176.","DOI":"10.1109\/QoMEX58391.2023.10178496"},{"key":"3709_CR26","doi-asserted-by":"publisher","first-page":"1841","DOI":"10.1093\/bioinformatics\/btq302","volume":"26","author":"Y Murakami","year":"2010","unstructured":"Murakami Y, Mizuguchi K. Applying the Naive Bayes classifier with kernel density estimation to the prediction of protein-protein interaction sites. Bioinformatics. 2010;26:1841\u20138.","journal-title":"Bioinformatics"},{"key":"3709_CR27","doi-asserted-by":"crossref","unstructured":"Singh G, Dhole K, Pai PP, Mondal S. SPRINGS: prediction of protein-protein interaction sites using artificial neural networks. PeerJ PrePrints. 2014; p. e266v2.","DOI":"10.7287\/peerj.preprints.266v2"},{"issue":"2","key":"3709_CR28","doi-asserted-by":"publisher","first-page":"190","DOI":"10.7861\/fhj.2022-0013","volume":"9","author":"A Arora","year":"2022","unstructured":"Arora A, Arora A. Generative adversarial networks and synthetic patient data: current challenges and future perspectives. Future Healthc J. 2022;9(2):190\u20133.","journal-title":"Future Healthc J."},{"key":"3709_CR29","doi-asserted-by":"publisher","first-page":"121","DOI":"10.1186\/s40537-024-00982-x","volume":"11","author":"INM Adiputra","year":"2024","unstructured":"Adiputra INM, Wanchai P. CTGAN-ENN: a tabular GAN-based hybrid sampling method for imbalanced and overlapped data in customer churn prediction. J Big Data. 2024;11:121.","journal-title":"J Big Data"},{"key":"3709_CR30","doi-asserted-by":"crossref","unstructured":"Bhat P, Patil N. An exhaustive review of computational prediction techniques for PPI sites, protein locations, and protein functions. Netw Model Anal Health Inform Bioinform. 2023; 12(31).","DOI":"10.1007\/s13721-023-00427-0"},{"key":"3709_CR31","doi-asserted-by":"publisher","first-page":"630","DOI":"10.1002\/prot.21248","volume":"66","author":"A Porollo","year":"2007","unstructured":"Porollo A, Meller J. Prediction-based fingerprints of protein-protein interactions. Proteins. 2007;66:630\u201345.","journal-title":"Proteins"},{"key":"3709_CR32","doi-asserted-by":"publisher","first-page":"e13","DOI":"10.1093\/bioinformatics\/btl303","volume":"23","author":"Y Ofran","year":"2007","unstructured":"Ofran Y, Rost B. ISIS: interaction sites identified from sequence. Bioinformatics. 2007;23:e13\u20136.","journal-title":"Bioinformatics"},{"issue":"10","key":"3709_CR33","doi-asserted-by":"publisher","first-page":"1479","DOI":"10.1093\/bioinformatics\/btx005","volume":"33","author":"Q Hou","year":"2017","unstructured":"Hou Q, De Geest PFG, Vranken WF, Heringa J, Feenstra KA. Seeing the trees through the forest: sequence-based homo- and heteromeric protein-protein interaction sites prediction using random forest. Bioinformatics. 2017;33(10):1479\u201387.","journal-title":"Bioinformatics"},{"issue":"6","key":"3709_CR34","doi-asserted-by":"publisher","first-page":"3820","DOI":"10.1109\/TCBB.2023.3323493","volume":"20","author":"Y Li","year":"2023","unstructured":"Li Y, Lu S, Ma Q, Nan X, Zhang S. Protein-protein interaction site prediction based on attention mechanism and convolutional neural networks. IEEE\/ACM Trans Comput Biol Bioinf. 2023;20(6):3820\u20139.","journal-title":"IEEE\/ACM Trans Comput Biol Bioinf"},{"issue":"1","key":"3709_CR35","doi-asserted-by":"publisher","first-page":"297","DOI":"10.1109\/TCBB.2022.3154413","volume":"20","author":"K Li","year":"2023","unstructured":"Li K, Quan L, Jiang Y, Li Y, Zhou Y, Wu T, Lyu Q. ctP2ISP: protein-protein interaction sites prediction using convolution and transformer with data augmentation. IEEE\/ACM Trans Comput Biol Bioinf. 2023;20(1):297\u2013306.","journal-title":"IEEE\/ACM Trans Comput Biol Bioinf"},{"key":"3709_CR36","doi-asserted-by":"publisher","first-page":"1393","DOI":"10.1007\/s12551-022-01038-1","volume":"14","author":"Y Murakami","year":"2022","unstructured":"Murakami Y, Mizuguchi K. Recent developments of sequence-based prediction of protein-protein interactions. Biophys Rev. 2022;14:1393\u2013411.","journal-title":"Biophys Rev"},{"key":"3709_CR37","doi-asserted-by":"crossref","unstructured":"Jamasb AR, Day B, Cangea C, Lio P, Blundell TL. Deep learning for protein-protein interaction site prediction. In: Cecconi, D. editors. Proteomics data analysis. Methods in molecular biology. 2021; p. 2361.","DOI":"10.1007\/978-1-0716-1641-3_16"},{"key":"3709_CR38","doi-asserted-by":"crossref","unstructured":"Purohit A, Acharya S, Green J. A novel Greedy approach for Sequence based Computational prediction of Binding-Sites in Protein-Protein Interaction. In: 2021 IEEE 21st International Conference on Bioinformatics and Bioengineering (BIBE), Kragujevac, Serbia. 2021; 1\u20138.","DOI":"10.1109\/BIBE52308.2021.9635163"},{"key":"3709_CR39","doi-asserted-by":"crossref","unstructured":"Lu S, Li Y, Nan X, Zhang. Attention-based convolutional neural networks for protein-protein interaction site prediction. In: Proc. IEEE Int. Conf. Bioinf. Biomed. 2021; 141\u2013144.","DOI":"10.1109\/BIBM52615.2021.9669435"},{"issue":"12","key":"3709_CR40","doi-asserted-by":"publisher","DOI":"10.3389\/fgene.2021.784863","volume":"22","author":"M Tang","year":"2021","unstructured":"Tang M, Wu L, Yu X, Chu Z, Jin S, Liu J. Prediction of protein-protein interaction sites based on stratified attentional mechanisms. Front Genet. 2021;22(12): 784863.","journal-title":"Front Genet"},{"key":"3709_CR41","first-page":"2577","volume":"22","author":"W Kabsch","year":"1983","unstructured":"Kabsch W, Sander C. Dictionary of protein secondary structure: pattern recognition of hydrogen-bonded and geometrical features. Biopolym Original Res Biomol. 1983;22:2577\u2013637.","journal-title":"Biopolym Original Res Biomol"},{"key":"3709_CR42","doi-asserted-by":"publisher","first-page":"4775","DOI":"10.1007\/s40747-024-01399-y","volume":"10","author":"Q Leng","year":"2024","unstructured":"Leng Q, Guo J, Tao J, Meng X, Wang C. OBMI: oversampling borderline minority instances by a two-stage Tomek link-finding procedure for class imbalance problem. Complex Intell Syst. 2024;10:4775\u201392.","journal-title":"Complex Intell Syst"},{"key":"3709_CR43","doi-asserted-by":"publisher","DOI":"10.3389\/fgene.2021.752732","volume":"12","author":"P Wang","year":"2021","unstructured":"Wang P, Zhang G, Yu Z-G, Huang G. A deep learning and XGBoost-based method for predicting protein-protein interaction sites. Front Genet. 2021;12: 752732.","journal-title":"Front Genet"}],"container-title":["SN Computer Science"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s42979-025-03709-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s42979-025-03709-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s42979-025-03709-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,2,15]],"date-time":"2025-02-15T09:12:46Z","timestamp":1739610766000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s42979-025-03709-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,2,15]]},"references-count":43,"journal-issue":{"issue":"2","published-online":{"date-parts":[[2025,2]]}},"alternative-id":["3709"],"URL":"https:\/\/doi.org\/10.1007\/s42979-025-03709-8","relation":{},"ISSN":["2661-8907"],"issn-type":[{"value":"2661-8907","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,2,15]]},"assertion":[{"value":"10 April 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 January 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 February 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors state that they have no conflicting interests concerning the material presented in this manuscript.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"Inapplicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Research Involving Human and\/or Animals"}},{"value":"Inapplicable.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Informed Consent"}}],"article-number":"176"}}