{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,23]],"date-time":"2026-03-23T16:09:49Z","timestamp":1774282189618,"version":"3.50.1"},"reference-count":56,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2026,2,14]],"date-time":"2026-02-14T00:00:00Z","timestamp":1771027200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2026,3,23]],"date-time":"2026-03-23T00:00:00Z","timestamp":1774224000000},"content-version":"vor","delay-in-days":37,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Cloud Comp"],"DOI":"10.1186\/s13677-026-00852-2","type":"journal-article","created":{"date-parts":[[2026,2,14]],"date-time":"2026-02-14T02:24:38Z","timestamp":1771035878000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Cloud-assisted LLM-enhanced datasets for AST hierarchy-aware code summarization model"],"prefix":"10.1186","volume":"15","author":[{"given":"Junsan","family":"Zhang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yudie","family":"Yan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Junxiao","family":"Han","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ao","family":"Lu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Juncai","family":"Guo","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Javad","family":"Pourzamani","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2026,2,14]]},"reference":[{"key":"852_CR1","doi-asserted-by":"publisher","first-page":"2179","DOI":"10.1007\/s10664-019-09730-9","volume":"25","author":"X Hu","year":"2020","unstructured":"Hu X, Li G, Xia X, Lo D, Jin Z (2020) Deep code comment generation with hybrid lexical and syntactical information. Empirical Softw Eng 25:2179\u20132217","journal-title":"Empirical Softw Eng"},{"key":"852_CR2","doi-asserted-by":"crossref","unstructured":"Song J, Zhang Z, Tang Z, Feng S, Gu Y (2024) Improving code summarization with tree transformer enhanced by position-related syntax complement. IEEE Trans Artif Intel","DOI":"10.1109\/TAI.2024.3395231"},{"key":"852_CR3","doi-asserted-by":"publisher","first-page":"102058","DOI":"10.1016\/j.inffus.2023.102058","volume":"103","author":"J Guo","year":"2024","unstructured":"Guo J, Liu J, Liu X, Li L (2024) Summarizing source code through heterogeneous feature fusion and extraction. Inf Fusion 103:102058","journal-title":"Inf Fusion"},{"key":"852_CR4","doi-asserted-by":"crossref","unstructured":"Hu X, Li G, Xia X, Lo D, Jin Z (2018) Deep code comment generation. In Proceedings of the 26th Conference on Program Comprehension, pp 200\u2013210","DOI":"10.1145\/3196321.3196334"},{"key":"852_CR5","doi-asserted-by":"crossref","unstructured":"Tang Z, Shen X, Li C, Ge J, Huang L, Zhu Z, Luo B (2022) Ast-trans: code summarization with efficient tree-structured attention. In Proceedings of the 44th International Conference on Software Engineering, pp 150\u2013162","DOI":"10.1145\/3510003.3510224"},{"key":"852_CR6","doi-asserted-by":"crossref","unstructured":"Guo J, Liu J, Wan Y, Li L, Zhou P (2022) Modeling hierarchical syntax structure with triplet position for source code summarization. In Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp 486\u2013500","DOI":"10.18653\/v1\/2022.acl-long.37"},{"key":"852_CR7","doi-asserted-by":"crossref","unstructured":"Hu X, Li G, Xia X, Lo D, Lu S, Jin Z (2018) Summarizing source code with transferred api knowledge","DOI":"10.24963\/ijcai.2018\/314"},{"key":"852_CR8","doi-asserted-by":"crossref","unstructured":"Wan Y, Zhao Z, Yang M, Xu G, Ying H, Wu J, Yu PS (2018) Improving automatic source code summarization via deep reinforcement learning. In Proceedings of the 33rd ACM\/IEEE International Conference on Automated Software Engineering, pp 397\u2013407","DOI":"10.1145\/3238147.3238206"},{"key":"852_CR9","doi-asserted-by":"publisher","first-page":"100","DOI":"10.1016\/j.neucom.2019.11.067","volume":"385","author":"L Qiao","year":"2020","unstructured":"Qiao L, Li X, Umer Q, Guo P (2020) Deep learning based software defect prediction. Neurocomputing 385:100\u2013110","journal-title":"Neurocomputing"},{"issue":"9","key":"852_CR10","first-page":"1811","volume":"47","author":"H Liu","year":"2019","unstructured":"Liu H, Jin J, Xu Z, Zou Y, Bu Y, Zhang L (2019) Deep learning based code smell detection. IEEE Trans Softw Eng 47(9):1811\u20131837","journal-title":"IEEE Trans Softw Eng"},{"key":"852_CR11","doi-asserted-by":"crossref","unstructured":"LeClair A, Haque S, Wu L, McMillan C (2020) Improved code summarization via a graph neural network. In Proceedings of the 28th International Conference on Program Comprehension, pp 184\u2013195","DOI":"10.1145\/3387904.3389268"},{"issue":"1","key":"852_CR12","doi-asserted-by":"publisher","first-page":"18","DOI":"10.26599\/TST.2023.9010158","volume":"30","author":"X Wang","year":"2024","unstructured":"Wang X, Ma J (2024) Cloud-network-end collaborative security for wireless networks: architecture, mechanisms, and applications. Tsinghua Sci Technol 30(1):18\u201333","journal-title":"Tsinghua Sci Technol"},{"key":"852_CR13","unstructured":"Rossi E, Charpentier B, Di Giovanni F, Frasca F, G\u00fcnnemann S, Bronstein MM (2024) Edge directionality improves learning on heterophilic graphs. In Learning on Graphs Conference, PMLR, pp. 25\u20131"},{"key":"852_CR14","doi-asserted-by":"crossref","unstructured":"LeClair A, McMillan C (2019). Recommendations for datasets for source code summarization. arXiv preprint arXiv:1904.02660","DOI":"10.18653\/v1\/N19-1394"},{"issue":"2","key":"852_CR15","doi-asserted-by":"publisher","first-page":"908","DOI":"10.26599\/TST.2024.9010101","volume":"30","author":"S Alyahyan","year":"2024","unstructured":"Alyahyan S, Alatawi MN, Alnfiai MM, Alotaibi SD, Alshammari A, Alzaid Z, Alwageed HS (2024) Software reliability assessment: an architectural and component impact analysis. Tsinghua Sci Technol 30(2):908\u2013925","journal-title":"Tsinghua Sci Technol"},{"key":"852_CR16","doi-asserted-by":"crossref","unstructured":"Wang S, Liu T, Tan L (2016) Automatically learning semantic features for defect prediction. In Proceedings of the 38th International Conference on Software Engineering, pp 297\u2013308","DOI":"10.1145\/2884781.2884804"},{"issue":"4","key":"852_CR17","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3212695","volume":"51","author":"M Allamanis","year":"2018","unstructured":"Allamanis M, Barr ET, Devanbu P, Sutton C (2018) A survey of machine learning for big code and naturalness. ACM Comput Surv (CSUR) 51(4):1\u201337","journal-title":"ACM Comput Surv (CSUR)"},{"key":"852_CR18","unstructured":"Wei B, Li G, Xia X, Fu Z, Jin Z (2019) Code generation as a dual task of code summarization. Adv Neural Inf Process Syst 32"},{"key":"852_CR19","doi-asserted-by":"crossref","unstructured":"Iyer S, Konstas I, Cheung A, Zettlemoyer L (2016) Summarizing source code using a neural attention model. In 54th Annual Meeting of the Association for Computational Linguistics 2016, Association for Computational Linguistics, pp. 2073\u20132083","DOI":"10.18653\/v1\/P16-1195"},{"key":"852_CR20","doi-asserted-by":"crossref","unstructured":"Ahmad WU, Chakraborty S, Ray B, Chang K-W (2020). A transformer-based approach for source code summarization. arXiv preprint arXiv:2005.00653","DOI":"10.18653\/v1\/2020.acl-main.449"},{"key":"852_CR21","unstructured":"Wang W, Zhang Y, Zeng Z, Xu G (2020). Trans 3: a transformer-based framework for unifying code summarization and code search. arXiv preprint arXiv:2003.03238"},{"key":"852_CR22","unstructured":"Alon U, Brody S, Levy O, Yahav E (2018). code2seq: generating sequences from structured representations of code. arXiv preprint arXiv:1808.01400"},{"key":"852_CR23","unstructured":"Hamilton W, Ying Z, Leskovec J (2017) Inductive representation learning on large graphs. Adv Neural Inf Process Syst 30"},{"issue":"4","key":"852_CR24","doi-asserted-by":"publisher","first-page":"765","DOI":"10.3390\/electronics13040765","volume":"13","author":"Q Zhang","year":"2024","unstructured":"Zhang Q, Jin D, Wang Y, Gong Y (2024) Statement-grained hierarchy enhanced code summarization. Electronics 13(4):765","journal-title":"Electronics"},{"key":"852_CR25","doi-asserted-by":"crossref","unstructured":"Wu H, Zhao H, Zhang M (2020). Code summarization with structure-induced transformer. arXiv preprint arXiv:2012.14710","DOI":"10.18653\/v1\/2021.findings-acl.93"},{"key":"852_CR26","doi-asserted-by":"crossref","unstructured":"Gu J, Salza P, Gall HC (2022) Assemble foundation models for automatic code summarization. In 2022 IEEE International Conference on Software Analysis, Evolution and Reengineering (SANER), IEEE, pp. 935\u2013946","DOI":"10.1109\/SANER53432.2022.00112"},{"issue":"8","key":"852_CR27","first-page":"9","volume":"1","author":"A Radford","year":"2019","unstructured":"Radford A, Wu J, Child R, Luan D, Amodei D, Sutskever I et al. (2019) Language models are unsupervised multitask learners. OpenAI Blog 1(8):9","journal-title":"OpenAI Blog"},{"key":"852_CR28","doi-asserted-by":"crossref","unstructured":"Gao Y, Lyu C (2022) M2ts: multi-scale multi-modal approach based on transformer for source code summarization. In Proceedings of the 30th IEEE\/ACM International Conference on Program Comprehension, pp 24\u201335","DOI":"10.1145\/3524610.3527907"},{"key":"852_CR29","unstructured":"Lee J, Toutanova K (2018) Pre-training of deep bidirectional transformers for language understanding. arXiv Prepr arXiv: 1810.04805 3(8)"},{"key":"852_CR30","doi-asserted-by":"crossref","unstructured":"Jiang B, Zhang Z, Lin D, Tang J, Luo B (2019) Semi-supervised learning with graph learning-convolutional networks. In Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 11313\u201311320","DOI":"10.1109\/CVPR.2019.01157"},{"key":"852_CR31","doi-asserted-by":"crossref","unstructured":"Wang Y, Dong Y, Lu X, Zhou A (2022) Gypsum: learning hybrid representations for code summarization. In Proceedings of the 30th IEEE\/ACM International Conference on Program Comprehension, pp 12\u201323","DOI":"10.1145\/3524610.3527903"},{"key":"852_CR32","doi-asserted-by":"crossref","unstructured":"Zhu S, Li J, Peng H, Wang S, He L (2021) Adversarial directed graph embedding. In Proceedings of the AAAI Conference on Artificial Intelligence, vol 35. pp 4741\u20134748","DOI":"10.1609\/aaai.v35i5.16605"},{"issue":"5","key":"852_CR33","doi-asserted-by":"publisher","first-page":"1174","DOI":"10.26599\/BDMA.2025.9020006","volume":"8","author":"Y Liu","year":"2025","unstructured":"Liu Y, Yi S, Chen X, Guo W, He L (2025) Biological knowledge graph-enhanced cancer state prediction network with adjustable connections. Big Data Min Analytics 8(5):1174\u20131188","journal-title":"Big Data Min Analytics"},{"issue":"2","key":"852_CR34","doi-asserted-by":"publisher","first-page":"926","DOI":"10.26599\/TST.2024.9010140","volume":"30","author":"X Liu","year":"2024","unstructured":"Liu X, Lv J, Kim B-G, Li K, Jin H, Gao W, Bai J (2024) Cooperative digital healthcare task scheduling and resource management in edge intelligence systems. Tsinghua Sci Technol 30(2):926\u2013945","journal-title":"Tsinghua Sci Technol"},{"key":"852_CR35","first-page":"1877","volume":"33","author":"T Brown","year":"2020","unstructured":"Brown T, Mann B, Ryder N, Subbiah M, Kaplan JD, Dhariwal P, Neelakantan A, Shyam P, Sastry G, Askell A et al. (2020) Language models are few-shot learners. Adv Neural Inf Process Syst 33:1877\u20131901","journal-title":"Adv Neural Inf Process Syst"},{"issue":"240","key":"852_CR36","first-page":"1","volume":"24","author":"A Chowdhery","year":"2023","unstructured":"Chowdhery A, Narang S, Devlin J, Bosma M, Mishra G, Roberts A, Barham P, Chung HW, Sutton C, Gehrmann S et al. (2023) Palm: scaling language modeling with pathways. J Mach Learn Res 24(240):1\u2013113","journal-title":"J Mach Learn Res"},{"key":"852_CR37","unstructured":"Touvron H, Lavril T, Izacard G, Martinet X, Lachaux M-A, Lacroix T, Rozi\u00e8re B, Goyal N, Hambro E, Azhar F, et al. (2023). Llama: open and efficient foundation language models. arXiv preprint arXiv:2302.13971"},{"issue":"1","key":"852_CR38","doi-asserted-by":"publisher","first-page":"145","DOI":"10.26599\/BDMA.2024.9020049","volume":"8","author":"J Zhao","year":"2024","unstructured":"Zhao J, Kong L, Lv J (2024) An overview of deep neural networks for few-shot learning. Big Data Min Analytics 8(1):145\u2013188","journal-title":"Big Data Min Analytics"},{"key":"852_CR39","unstructured":"OpenAI (2024 June) Gpt-4o mini: advancing cost-efficient intelligence. Technical report, OpenAI"},{"key":"852_CR40","doi-asserted-by":"crossref","unstructured":"Choi Y, Bak J, Na C, Lee J-H (2021) Learning sequential and structural information for source code summarization. In Findings of the Association for Computational Linguistics: ACL-IJCNLP 2021, pp 2842\u20132851","DOI":"10.18653\/v1\/2021.findings-acl.251"},{"key":"852_CR41","unstructured":"Cai T, Luo S, Xu K, He D, Liu T-Y, Wang L (2021) Graphnorm: a principled approach to accelerating graph neural network training. In International Conference on Machine Learning, PMLR, pp. 1204\u20131215"},{"key":"852_CR42","unstructured":"Barone AVM, Sennrich R (2017). A parallel corpus of python functions and documentation strings for automated code documentation and code generation. arXiv preprint arXiv:1707.02275"},{"key":"852_CR43","unstructured":"Zheng J, Cao B, Ma Z, Pan R, Lin H, Lu Y, Han X, Sun L (2024). Beyond correctness: benchmarking multi-dimensional code generation for large language models. arXiv preprint arXiv:2407.11470"},{"key":"852_CR44","doi-asserted-by":"crossref","unstructured":"Zhang J, Lu A, Han J, Zhu Y, Yan Y, Guo J, Wan Y (2025) Hesqlnet: a heterogeneous graph neural network for sql-to-text generation. Inf Softw Technol 107820","DOI":"10.1016\/j.infsof.2025.107820"},{"key":"852_CR45","doi-asserted-by":"crossref","unstructured":"Papineni K, Roukos S, Ward T, Zhu W-J (2002) Bleu: a method for automatic evaluation of machine translation. In Proceedings of the 40th Annual Meeting of the Association for Computational Linguistics, pp 311\u2013318","DOI":"10.3115\/1073083.1073135"},{"key":"852_CR46","unstructured":"Banerjee S, Lavie A (2005) Meteor: an automatic metric for mt evaluation with improved correlation with human judgments. In Proceedings of the Acl Workshop on Intrinsic and Extrinsic Evaluation Measures for Machine Translation And\/or Summarization, pp 65\u201372"},{"key":"852_CR47","unstructured":"Lin C-Y (2004) Rouge: a package for automatic evaluation of summaries. In Text Summarization Branches Out, pp 74\u201381"},{"key":"852_CR48","doi-asserted-by":"crossref","unstructured":"Eriguchi A, Hashimoto K, Tsuruoka Y (2016). Tree-to-sequence attentional neural machine translation. arXiv preprint arXiv:1603.06075","DOI":"10.18653\/v1\/P16-1078"},{"key":"852_CR49","doi-asserted-by":"crossref","unstructured":"Gong Z, Gao C, Wang Y, Gu W, Peng Y, Xu Z (2022) Source code summarization with structural relative position guided transformer. In 2022 IEEE International Conference on Software Analysis, Evolution and Reengineering (SANER), IEEE, pp. 13\u201324","DOI":"10.1109\/SANER53432.2022.00013"},{"key":"852_CR50","doi-asserted-by":"crossref","unstructured":"Feng Z, Guo D, Tang D, Duan N, Feng X, Gong M, Shou L, Qin B, Liu T, Jiang D, et al. (2020). Codebert: a pre-trained model for programming and natural languages. arXiv preprint arXiv:2002.08155","DOI":"10.18653\/v1\/2020.findings-emnlp.139"},{"key":"852_CR51","doi-asserted-by":"crossref","unstructured":"Wang Y, Wang W, Joty S, Hoi SC (2021). Codet5: identifier-aware unified pre-trained encoder-decoder models for code understanding and generation. arXiv preprint arXiv:2109.00859","DOI":"10.18653\/v1\/2021.emnlp-main.685"},{"key":"852_CR52","doi-asserted-by":"crossref","unstructured":"Fang C, Sun W, Chen Y, Chen X, Wei Z, Zhang Q, You Y, Luo B, Liu Y, Chen Z (2024) Esale: enhancing code-summary alignment learning for source code summarization. IEEE Trans Softw Eng","DOI":"10.1109\/TSE.2024.3422274"},{"key":"852_CR53","doi-asserted-by":"crossref","unstructured":"Sun W, Miao Y, Li Y, Zhang H, Fang C, Liu Y, Deng G, Liu Y, Chen Z (2024). Source code summarization in the era of large language models. arXiv preprint arXiv:2407.07959","DOI":"10.1109\/ICSE55347.2025.00034"},{"key":"852_CR54","doi-asserted-by":"crossref","unstructured":"Shi E, Wang Y, Du L, Chen J, Han S, Zhang H, Zhang D, Sun H (2022) On the evaluation of neural code summarization. In Proceedings of the 44th International Conference on Software Engineering, pp 1597\u20131608","DOI":"10.1145\/3510003.3510060"},{"issue":"4","key":"852_CR55","doi-asserted-by":"publisher","first-page":"1098","DOI":"10.26599\/BDMA.2024.9020037","volume":"7","author":"S Wang","year":"2024","unstructured":"Wang S, Wang C, Dong T, He Y, Xiao K (2024) Personalized privacy-preserving data utilization approach powered by distributed-gan. Big Data Min Analytics 7(4):1098\u20131113","journal-title":"Big Data Min Analytics"},{"issue":"3","key":"852_CR56","doi-asserted-by":"publisher","first-page":"699","DOI":"10.26599\/BDMA.2024.9020023","volume":"7","author":"K Zhang","year":"2024","unstructured":"Zhang K, Tsai P-W, Tian J, Zhao W, Cai X, Gao L, Chen J (2024) Towards privacy in decentralized iot: a blockchain-based dual response dp mechanism. Big Data Min Analytics 7(3):699\u2013717","journal-title":"Big Data Min Analytics"}],"container-title":["Journal of Cloud Computing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/article\/10.1186\/s13677-026-00852-2","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s13677-026-00852-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s13677-026-00852-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,23]],"date-time":"2026-03-23T15:42:35Z","timestamp":1774280555000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1186\/s13677-026-00852-2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,2,14]]},"references-count":56,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2026,12]]}},"alternative-id":["852"],"URL":"https:\/\/doi.org\/10.1186\/s13677-026-00852-2","relation":{},"ISSN":["2192-113X"],"issn-type":[{"value":"2192-113X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,2,14]]},"assertion":[{"value":"9 December 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"24 January 2026","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"14 February 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"Not applicable.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval"}},{"value":"The authors declare no competing interests.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests."}}],"article-number":"44"}}