{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,5]],"date-time":"2026-02-05T23:25:01Z","timestamp":1770333901235,"version":"3.49.0"},"reference-count":43,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,2,10]],"date-time":"2025-02-10T00:00:00Z","timestamp":1739145600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2025,2,10]],"date-time":"2025-02-10T00:00:00Z","timestamp":1739145600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62302317"],"award-info":[{"award-number":["62302317"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Project of Guangdong Provincial Key Laboratory of Novel Security Intelligence Technologies","award":["2022B1212010005"],"award-info":[{"award-number":["2022B1212010005"]}]},{"name":"Shenzhen Colleges and Universities Stable Support Program","award":["20220715183602001"],"award-info":[{"award-number":["20220715183602001"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["BMC Bioinformatics"],"DOI":"10.1186\/s12859-025-06059-7","type":"journal-article","created":{"date-parts":[[2025,2,10]],"date-time":"2025-02-10T12:01:22Z","timestamp":1739188882000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["SEGT-GO: a graph transformer method based on PPI serialization and explanatory artificial intelligence for protein function prediction"],"prefix":"10.1186","volume":"26","author":[{"given":"Yansong","family":"Wang","sequence":"first","affiliation":[]},{"given":"Yundong","family":"Sun","sequence":"additional","affiliation":[]},{"given":"Baohui","family":"Lin","sequence":"additional","affiliation":[]},{"given":"Haotian","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Xiaoling","family":"Luo","sequence":"additional","affiliation":[]},{"given":"Yumeng","family":"Liu","sequence":"additional","affiliation":[]},{"given":"Xiaopeng","family":"Jin","sequence":"additional","affiliation":[]},{"given":"Dongjie","family":"Zhu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,2,10]]},"reference":[{"issue":"3","key":"6059_CR1","doi-asserted-by":"publisher","first-page":"117","DOI":"10.1093\/bib\/bbad117","volume":"24","author":"Q Yuan","year":"2023","unstructured":"Yuan Q, Xie J, Xie J, Zhao H, Yang Y. Fast and accurate protein function prediction from sequence through pretrained language model and homology-based label diffusion. Brief Bioinform. 2023;24(3):117.","journal-title":"Brief Bioinform"},{"issue":"10","key":"6059_CR2","doi-asserted-by":"publisher","first-page":"637","DOI":"10.1093\/bioinformatics\/btad637","volume":"39","author":"P Jiao","year":"2023","unstructured":"Jiao P, Wang B, Wang X, Liu B, Wang Y, Li J. Struct2go: protein function prediction based on graph pooling algorithm and alphafold2 structure information. Bioinformatics. 2023;39(10):637.","journal-title":"Bioinformatics"},{"issue":"6306","key":"6059_CR3","doi-asserted-by":"publisher","first-page":"1420","DOI":"10.1126\/science.aaf1420","volume":"353","author":"M Costanzo","year":"2016","unstructured":"Costanzo M, VanderSluis B, Koch EN, Baryshnikova A, Pons C, Tan G, Wang W, Usaj M, Hanchard J, Lee SD, et al. A global genetic interaction network maps a wiring diagram of cellular function. Science. 2016;353(6306):1420.","journal-title":"Science"},{"key":"6059_CR4","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s13059-016-1037-6","volume":"17","author":"Y Jiang","year":"2016","unstructured":"Jiang Y, Oron TR, Clark WT, Bankapur AR, D\u2019Andrea D, Lepore R, Funk CS, Kahanda I, Verspoor KM, Ben-Hur A, et al. An expanded evaluation of protein function prediction methods shows an improvement in accuracy. Genome Biol. 2016;17:1\u201319.","journal-title":"Genome Biol"},{"key":"6059_CR5","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s13059-019-1835-8","volume":"20","author":"N Zhou","year":"2019","unstructured":"Zhou N, Jiang Y, Bergquist TR, Lee AJ, Kacsoh BZ, Crocker AW, Lewis KA, Georghiou G, Nguyen HN, Hamid MN, et al. The CAFA challenge reports improved protein function prediction and new functional annotations for hundreds of genes through experimental screens. Genome Biol. 2019;20:1\u201323.","journal-title":"Genome Biol"},{"key":"6059_CR6","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s12864-018-5024-z","volume":"19","author":"W Qiao","year":"2018","unstructured":"Qiao W, Akhter N, Fang X, Maximova T, Plaku E, Shehu A. From mutations to mechanisms and dysfunction via computation and mining of protein energy landscapes. BMC Genom. 2018;19:1\u201313.","journal-title":"BMC Genom"},{"issue":"1","key":"6059_CR7","doi-asserted-by":"publisher","first-page":"3198","DOI":"10.1038\/s41598-021-82410-1","volume":"11","author":"IA Guedes","year":"2021","unstructured":"Guedes IA, Barreto AM, Marinho D, Krempser E, Kuenemann MA, Sperandio O, Dardenne LE, Miteva MA. New machine learning and physics-based scoring functions for drug discovery. Sci Rep. 2021;11(1):3198.","journal-title":"Sci Rep"},{"issue":"8","key":"6059_CR8","doi-asserted-by":"publisher","first-page":"3149","DOI":"10.1021\/acs.jcim.4c00115","volume":"64","author":"J Chang","year":"2024","unstructured":"Chang J, Fan X, Tian B. Deepp450: predicting human p450 activities of small molecules by integrating pretrained protein language model and molecular representation. J Chem Inf Model. 2024;64(8):3149\u201360.","journal-title":"J Chem Inf Model"},{"issue":"4","key":"6059_CR9","doi-asserted-by":"publisher","first-page":"289","DOI":"10.1093\/bib\/bbae289","volume":"25","author":"B Lin","year":"2024","unstructured":"Lin B, Luo X, Liu Y, Jin X. A comprehensive review and comparison of existing computational methods for protein function prediction. Brief Bioinform. 2024;25(4):289.","journal-title":"Brief Bioinform"},{"issue":"10","key":"6059_CR10","doi-asserted-by":"publisher","first-page":"4957","DOI":"10.1109\/JBHI.2022.3163150","volume":"26","author":"R Dhanuka","year":"2022","unstructured":"Dhanuka R, Tripathi A, Singh JP. A semi-supervised autoencoder-based approach for protein function prediction. IEEE J Biomed Health Inform. 2022;26(10):4957\u201365.","journal-title":"IEEE J Biomed Health Inform"},{"issue":"22","key":"6059_CR11","doi-asserted-by":"publisher","first-page":"3873","DOI":"10.1093\/bioinformatics\/bty440","volume":"34","author":"V Gligorijevi\u0107","year":"2018","unstructured":"Gligorijevi\u0107 V, Barot M, Bonneau R. deepnf: deep network fusion for protein function prediction. Bioinformatics. 2018;34(22):3873\u201381.","journal-title":"Bioinformatics"},{"key":"6059_CR12","unstructured":"Kipf TN, Welling M. Semi-supervised classification with graph convolutional networks. In: International Conference on Learning Representations (2022)"},{"issue":"1","key":"6059_CR13","doi-asserted-by":"publisher","first-page":"262","DOI":"10.1093\/bioinformatics\/btab270","volume":"37","author":"R You","year":"2021","unstructured":"You R, Yao S, Mamitsuka H, Zhu S. Deepgraphgo: graph neural network for large-scale, multispecies protein function prediction. Bioinformatics. 2021;37(1):262\u201371.","journal-title":"Bioinformatics"},{"key":"6059_CR14","doi-asserted-by":"publisher","DOI":"10.1109\/JBHI.2024.3357834","author":"Y Zhao","year":"2024","unstructured":"Zhao Y, Yang Z, Wang L, Zhang Y, Lin H, Wang J. Predicting protein functions based on heterogeneous graph attention technique. IEEE J Biomed Health Inform. 2024. https:\/\/doi.org\/10.1109\/JBHI.2024.3357834.","journal-title":"IEEE J Biomed Health Inform"},{"issue":"5","key":"6059_CR15","doi-asserted-by":"publisher","first-page":"1595","DOI":"10.1109\/TETCI.2023.3249255","volume":"7","author":"K Bose","year":"2023","unstructured":"Bose K, Das S. Can graph neural networks go deeper without over-smoothing? Yes, with a randomized path exploration! IEEE Trans Emerg Top Comput Intell. 2023;7(5):1595\u2013604.","journal-title":"IEEE Trans Emerg Top Comput Intell."},{"issue":"7","key":"6059_CR16","first-page":"7192","volume":"35","author":"Y Sun","year":"2022","unstructured":"Sun Y, Zhu D, Du H, Tian Z. MHNF: multi-hop heterogeneous neighborhood information fusion graph representation learning. IEEE Trans Knowl Data Eng. 2022;35(7):7192\u2013205.","journal-title":"IEEE Trans Knowl Data Eng."},{"key":"6059_CR17","first-page":"7793","volume":"33","author":"J Zhu","year":"2020","unstructured":"Zhu J, Yan Y, Zhao L, Heimann M, Akoglu L, Koutra D. Beyond homophily in graph neural networks: current limitations and effective designs. Adv Neural Inf Process Syst. 2020;33:7793\u2013804.","journal-title":"Adv Neural Inf Process Syst"},{"key":"6059_CR18","doi-asserted-by":"publisher","DOI":"10.1016\/j.neunet.2024.106645","volume":"181","author":"Y Sun","year":"2024","unstructured":"Sun Y, Zhu D, Wang Y, Fu Y, Tian Z. GTC: gnn-transformer co-contrastive learning for self-supervised heterogeneous graph representation. Neural Netw. 2024;181: 106645.","journal-title":"Neural Netw"},{"key":"6059_CR19","unstructured":"Vaswani A, Shazeer N, Parmar N, Uszkoreit J, Jones L, Gomez AN, Kaiser \u0141, Polosukhin I. Attention is all you need. Advances in neural information processing systems. 30 (2017)"},{"key":"6059_CR20","doi-asserted-by":"crossref","unstructured":"Ahmadi N, Sand H, Papotti P. Unsupervised matching of data and text. In: 2022 IEEE 38th International Conference on Data Engineering (ICDE), pp. 1058\u20131070. IEEE (2022)","DOI":"10.1109\/ICDE53745.2022.00084"},{"key":"6059_CR21","unstructured":"Dosovitskiy A, Beyer L, Kolesnikov A, Weissenborn D, Zhai X, Unterthiner T, Dehghani M, Minderer M, Heigold G, Gelly S, Uszkoreit J, Houlsby N. An image is worth 16x16 words: transformers for image recognition at scale. In: International Conference on Learning Representations (2021)"},{"key":"6059_CR22","first-page":"14541","volume":"35","author":"Z Pan","year":"2022","unstructured":"Pan Z, Cai J, Zhuang B. Fast vision transformers with HILO attention. Adv Neural Inf Process Syst. 2022;35:14541\u201354.","journal-title":"Adv Neural Inf Process Syst"},{"issue":"3","key":"6059_CR23","doi-asserted-by":"publisher","first-page":"094","DOI":"10.1093\/bioinformatics\/btad094","volume":"39","author":"T Pan","year":"2023","unstructured":"Pan T, Li C, Bi Y, Wang Z, Gasser RB, Purcell AW, Akutsu T, Webb GI, Imoto S, Song J. Pfresgo: an attention mechanism-based deep-learning approach for protein annotation by integrating gene ontology inter-relationships. Bioinformatics. 2023;39(3):094.","journal-title":"Bioinformatics"},{"key":"6059_CR24","first-page":"1","volume":"11","author":"E Strumbelj","year":"2010","unstructured":"Strumbelj E, Kononenko I. An efficient explanation of individual classifications using game theory. J Mach Learn Res. 2010;11:1\u201318.","journal-title":"J Mach Learn Res."},{"issue":"6","key":"6059_CR25","doi-asserted-by":"publisher","first-page":"556","DOI":"10.1093\/bib\/bbab556","volume":"24","author":"X Zhang","year":"2023","unstructured":"Zhang X, Guo H, Zhang F, Wang X, Wu K, Qiu S, Liu B, Wang Y, Hu Y, Li J. Hnetgo: protein function prediction via heterogeneous network transformer. Brief Bioinform. 2023;24(6):556.","journal-title":"Brief Bioinform"},{"issue":"D1","key":"6059_CR26","doi-asserted-by":"publisher","first-page":"435","DOI":"10.1093\/nar\/gkx1069","volume":"46","author":"TE Lewis","year":"2018","unstructured":"Lewis TE, Sillitoe I, Dawson N, Lam SD, Clarke T, Lee D, Orengo C, Lees J. Gene3d: extensive prediction of globular domains in proteins. Nucl Acids Res. 2018;46(D1):435\u20139.","journal-title":"Nucl Acids Res"},{"issue":"D1","key":"6059_CR27","doi-asserted-by":"publisher","first-page":"200","DOI":"10.1093\/nar\/gkw1129","volume":"45","author":"A Marchler-Bauer","year":"2017","unstructured":"Marchler-Bauer A, Bo Y, Han L, He J, Lanczycki CJ, Lu S, Chitsaz F, Derbyshire MK, Geer RC, Gonzales NR, et al. Cdd\/sparcle: functional classification of proteins via subfamily domain architectures. Nucl Acids Res. 2017;45(D1):200\u20133.","journal-title":"Nucl Acids Res"},{"issue":"D1","key":"6059_CR28","doi-asserted-by":"publisher","first-page":"279","DOI":"10.1093\/nar\/gkv1344","volume":"44","author":"RD Finn","year":"2016","unstructured":"Finn RD, Coggill P, Eberhardt RY, Eddy SR, Mistry J, Mitchell AL, Potter SC, Punta M, Qureshi M, Sangrador-Vegas A, et al. The pfam protein families database: towards a more sustainable future. Nucleic Acids Res. 2016;44(D1):279\u201385.","journal-title":"Nucleic Acids Res"},{"issue":"9","key":"6059_CR29","doi-asserted-by":"publisher","first-page":"1236","DOI":"10.1093\/bioinformatics\/btu031","volume":"30","author":"P Jones","year":"2014","unstructured":"Jones P, Binns D, Chang H-Y, Fraser M, Li W, McAnulla C, McWilliam H, Maslen J, Mitchell A, Nuka G, et al. Interproscan 5: genome-scale protein function classification. Bioinformatics. 2014;30(9):1236\u201340.","journal-title":"Bioinformatics"},{"issue":"D1","key":"6059_CR30","doi-asserted-by":"publisher","first-page":"506","DOI":"10.1093\/nar\/gky1049","volume":"47","author":"U Consortium","year":"2019","unstructured":"Consortium U. Uniprot: a worldwide hub of protein knowledge. Nucl Acids Res. 2019;47(D1):506\u201315.","journal-title":"Nucl Acids Res."},{"issue":"3","key":"6059_CR31","doi-asserted-by":"publisher","first-page":"123","DOI":"10.1093\/bioinformatics\/btad123","volume":"39","author":"Z Wu","year":"2023","unstructured":"Wu Z, Guo M, Jin X, Chen J, Liu B. CFAGO: cross-fusion of network and attributes based on attention mechanism for protein function prediction. Bioinformatics. 2023;39(3):123.","journal-title":"Bioinformatics"},{"issue":"7","key":"6059_CR32","doi-asserted-by":"publisher","first-page":"410","DOI":"10.1093\/bioinformatics\/btad410","volume":"39","author":"Z Gu","year":"2023","unstructured":"Gu Z, Luo X, Chen J, Deng M, Lai L. Hierarchical graph transformer with contrastive learning for protein function prediction. Bioinformatics. 2023;39(7):410.","journal-title":"Bioinformatics"},{"key":"6059_CR33","doi-asserted-by":"crossref","unstructured":"Chen J, Gao K, Li G, He K. NAGphormer: A tokenized graph transformer for node classification in large graphs. In: The Eleventh International Conference on Learning Representations (2023)","DOI":"10.1109\/TBDATA.2024.3524081"},{"key":"6059_CR34","unstructured":"Xiong R, Yang Y, He D, Zheng K, Zheng S, Xing C, Zhang H, Lan Y, Wang L, Liu T. On layer normalization in the transformer architecture. In: International Conference on Machine Learning, pp. 10524\u201310533. PMLR (2020)"},{"key":"6059_CR35","unstructured":"Velickovic P, Cucurull G, Casanova A, Romero A, Li\u00f2 P, Bengio Y. Graph attention networks. In: International Conference on Learning Representations (2018)"},{"key":"6059_CR36","doi-asserted-by":"crossref","unstructured":"Gilpin LH, Bau D, Yuan BZ, Bajwa A, Specter M, Kagal L. Explaining explanations: An overview of interpretability of machine learning. In: 2018 IEEE 5th International Conference on Data Science and Advanced Analytics (DSAA), pp. 80\u201389. IEEE (2018)","DOI":"10.1109\/DSAA.2018.00018"},{"key":"6059_CR37","unstructured":"Loshchilov I, Hutter F. Decoupled weight decay regularization. In: International Conference on Learning Representations (2018)"},{"issue":"W1","key":"6059_CR38","doi-asserted-by":"publisher","first-page":"379","DOI":"10.1093\/nar\/gkz388","volume":"47","author":"R You","year":"2019","unstructured":"You R, Yao S, Xiong Y, Huang X, Sun F, Mamitsuka H, Zhu S. Netgo: improving large-scale protein function prediction with massive network information. Nucl Acids Res. 2019;47(W1):379\u201387.","journal-title":"Nucl Acids Res"},{"issue":"14","key":"6059_CR39","doi-asserted-by":"publisher","first-page":"2465","DOI":"10.1093\/bioinformatics\/bty130","volume":"34","author":"R You","year":"2018","unstructured":"You R, Zhang Z, Xiong Y, Sun F, Mamitsuka H, Zhu S. Golabeler: improving sequence-based large-scale protein function prediction by learning to rank. Bioinformatics. 2018;34(14):2465\u201373.","journal-title":"Bioinformatics"},{"issue":"2","key":"6059_CR40","doi-asserted-by":"publisher","first-page":"422","DOI":"10.1093\/bioinformatics\/btz595","volume":"36","author":"M Kulmanov","year":"2020","unstructured":"Kulmanov M, Hoehndorf R. Deepgoplus: improved protein function prediction from sequence. Bioinformatics. 2020;36(2):422\u20139.","journal-title":"Bioinformatics"},{"issue":"2","key":"6059_CR41","doi-asserted-by":"publisher","first-page":"077","DOI":"10.1093\/bib\/bbae077","volume":"25","author":"W Li","year":"2024","unstructured":"Li W, Wang B, Dai J, Kou Y, Chen X, Pan Y, Hu S, Xu ZZ. Partial order relation-based gene ontology embedding improves protein function prediction. Brief Bioinform. 2024;25(2):077.","journal-title":"Brief Bioinform"},{"issue":"4","key":"6059_CR42","doi-asserted-by":"publisher","first-page":"364","DOI":"10.1093\/comjnl\/20.4.364","volume":"20","author":"D Defays","year":"1977","unstructured":"Defays D. An efficient algorithm for a complete link method. Comput J. 1977;20(4):364\u20136.","journal-title":"Comput J"},{"key":"6059_CR43","volume":"1566","author":"M Faisal","year":"2020","unstructured":"Faisal M, Zamzami E, et al. Comparative analysis of inter-centroid k-means performance using Euclidean distance, Canberra distance and Manhattan distance. J Phys: Conf Ser. 2020;1566: 012112.","journal-title":"J Phys: Conf Ser"}],"container-title":["BMC Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s12859-025-06059-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1186\/s12859-025-06059-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s12859-025-06059-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,2,10]],"date-time":"2025-02-10T12:01:35Z","timestamp":1739188895000},"score":1,"resource":{"primary":{"URL":"https:\/\/bmcbioinformatics.biomedcentral.com\/articles\/10.1186\/s12859-025-06059-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,2,10]]},"references-count":43,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2025,12]]}},"alternative-id":["6059"],"URL":"https:\/\/doi.org\/10.1186\/s12859-025-06059-7","relation":{},"ISSN":["1471-2105"],"issn-type":[{"value":"1471-2105","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,2,10]]},"assertion":[{"value":"5 November 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"20 January 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"10 February 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"Not applicable.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval and consent to participate"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}},{"value":"The authors declare that they have no Conflict of interest.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing\u00a0 interests"}}],"article-number":"46"}}