{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,26]],"date-time":"2026-02-26T15:24:12Z","timestamp":1772119452700,"version":"3.50.1"},"reference-count":69,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2026,1,9]],"date-time":"2026-01-09T00:00:00Z","timestamp":1767916800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,1,9]],"date-time":"2026-01-09T00:00:00Z","timestamp":1767916800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100000780","name":"European Union","doi-asserted-by":"crossref","award":["101189664"],"award-info":[{"award-number":["101189664"]}],"id":[{"id":"10.13039\/501100000780","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100000780","name":"European Union","doi-asserted-by":"crossref","award":["101189664"],"award-info":[{"award-number":["101189664"]}],"id":[{"id":"10.13039\/501100000780","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100000780","name":"European Union","doi-asserted-by":"crossref","award":["101189664"],"award-info":[{"award-number":["101189664"]}],"id":[{"id":"10.13039\/501100000780","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100003407","name":"Ministero dell\u2019Istruzione, dell\u2019Universit\u00e0 e della Ricerca","doi-asserted-by":"publisher","award":["P2022553SL"],"award-info":[{"award-number":["P2022553SL"]}],"id":[{"id":"10.13039\/501100003407","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100003407","name":"Ministero dell\u2019Istruzione, dell\u2019Universit\u00e0 e della Ricerca","doi-asserted-by":"publisher","award":["P2022553SL"],"award-info":[{"award-number":["P2022553SL"]}],"id":[{"id":"10.13039\/501100003407","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100003407","name":"Ministero dell\u2019Istruzione, dell\u2019Universit\u00e0 e della Ricerca","doi-asserted-by":"publisher","award":["P2022553SL"],"award-info":[{"award-number":["P2022553SL"]}],"id":[{"id":"10.13039\/501100003407","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Autom Softw Eng"],"published-print":{"date-parts":[[2026,12]]},"DOI":"10.1007\/s10515-025-00588-4","type":"journal-article","created":{"date-parts":[[2026,1,9]],"date-time":"2026-01-09T05:37:27Z","timestamp":1767937047000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Automated summarization of software documents: an LLM-based multi-agent approach"],"prefix":"10.1007","volume":"33","author":[{"given":"Duc S. H.","family":"Nguyen","sequence":"first","affiliation":[]},{"given":"Minh T.","family":"Nguyen","sequence":"additional","affiliation":[]},{"given":"Phuong T.","family":"Nguyen","sequence":"additional","affiliation":[]},{"given":"Juri","family":"Di Rocco","sequence":"additional","affiliation":[]},{"given":"Davide","family":"Di Ruscio","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2026,1,9]]},"reference":[{"key":"588_CR1","doi-asserted-by":"publisher","unstructured":"Allix, K., Bissyand\u00e9, T.F., Klein, J., Le\u00a0Traon, Y.: Androzoo: Collecting millions of android apps for the research community. In: Proceedings of the 13th International Conference on Mining Software Repositories. MSR \u201916, pp. 468\u2013471. New York, NY, USA. ACM (2016). ISBN 978-1-4503-4186-8. https:\/\/doi.org\/10.1145\/2901739.2903508. http:\/\/doi.acm.org\/10.1145\/2901739.2903508","DOI":"10.1145\/2901739.2903508"},{"key":"588_CR2","doi-asserted-by":"publisher","unstructured":"Aly, W.M., Soliman, T.H.A., AbdelAziz, A.M.: Cross-domain evaluation of large language models for abstractive text summarization: An empirical perspective. Int. J. Adv. Comput. Sci. Appl. 16(6) (2025). https:\/\/doi.org\/10.14569\/IJACSA.2025.0160695","DOI":"10.14569\/IJACSA.2025.0160695"},{"key":"588_CR3","doi-asserted-by":"crossref","unstructured":"Arawjo, I., Swoopes, C., Vaithilingam, P., Wattenberg, M., Glassman, E.L.: Chainforge: A visual toolkit for prompt engineering and llm hypothesis testing. In: Proceedings of the 2024 CHI Conference on Human Factors in Computing Systems, pp. 1\u201318 (2024)","DOI":"10.1145\/3613904.3642016"},{"key":"588_CR4","doi-asserted-by":"publisher","unstructured":"Chen, S., Xie, X., Yin, B., Ji, Y., Chen, L., Xu, B.: Stay professional and efficient: Automatically generate titles for your bug reports. In: Proceedings of the 35th IEEE\/ACM International Conference on Automated Software Engineering. ASE \u201920, pp. 385\u2013397. New York, NY, USA. Association for Computing Machinery (2021). ISBN 9781450367684. https:\/\/doi.org\/10.1145\/3324884.3416538","DOI":"10.1145\/3324884.3416538"},{"key":"588_CR5","doi-asserted-by":"publisher","unstructured":"Choi, J., Yun, J., Jin, K., Kim, Y.: Multi-news+: Cost-efficient dataset cleansing via LLM-based data annotation. In: Al-Onaizan, Y., Bansal, M., Chen, Y.-N. (eds.) Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing, pp. 15\u201329. Miami, Florida, USA. Association for Computational Linguistics (2024). https:\/\/doi.org\/10.18653\/v1\/2024.emnlp-main.2.","DOI":"10.18653\/v1\/2024.emnlp-main.2"},{"key":"588_CR6","doi-asserted-by":"publisher","unstructured":"Cinkusz, K., Chudziak, J.A.: Agile software management with cognitive multi-agent systems. In: Proceedings of the 17th International Conference on Agents and Artificial Intelligence (ICAART 2025) - Volume 1, pp. 385\u2013392. SCITEPRESS (2025). ISBN 978-989-758-737-5. https:\/\/doi.org\/10.5220\/0013153000003890","DOI":"10.5220\/0013153000003890"},{"key":"588_CR7","unstructured":"Contributors, P.: Fine-tuning llama2 with lora (2024). https:\/\/pytorch.org\/torchtune\/stable\/tutorials\/lora_finetune.html"},{"key":"588_CR8","unstructured":"Cui, W., Li, Z., Sun, H., Lopez, D., Das, K., Malin, B., Kumar, S., Zhang, J.: See: Strategic exploration and exploitation for cohesive in-context prompt optimization. arXiv:2402.11347 (2025). https:\/\/arxiv.org\/abs\/2402.11347"},{"issue":"9","key":"588_CR9","doi-asserted-by":"publisher","first-page":"389","DOI":"10.3390\/fi17090389","volume":"17","author":"A Dharrao","year":"2025","unstructured":"Dharrao, A., Shantharajah, S.P., Bhat, R.R.: A comparative study of pegasus, bart, and t5 for text summarization across diverse datasets. Future Internet 17(9), 389 (2025)","journal-title":"Future Internet"},{"key":"588_CR10","doi-asserted-by":"publisher","unstructured":"Doan, T.T.H., Nguyen, P.T., Di\u00a0Rocco, J., Di\u00a0Ruscio, D.: Too long; didn\u2019t read: Automatic summarization of GitHub README.MD with Transformers. In: Proceedings of the 27th International Conference on Evaluation and Assessment in Software Engineering. EASE \u201923, pp. 267\u2013272. New York, NY, USA. Association for Computing Machinery (2023). ISBN 9798400700446. https:\/\/doi.org\/10.1145\/3593434.3593448","DOI":"10.1145\/3593434.3593448"},{"key":"588_CR11","doi-asserted-by":"crossref","unstructured":"Fakhoury, S., Naik, A., Sakkas, G., Chakraborty, S., Lahiri, S.K.: Llm-based test-driven interactive code generation: User study and empirical evaluation. IEEE Trans. Softw. Eng. (2024)","DOI":"10.1109\/TSE.2024.3428972"},{"key":"588_CR12","unstructured":"Foland, A.: An automated length-aware quality metric for summarization (2025)"},{"key":"588_CR13","unstructured":"Golchin, S., Surdeanu, M.: Time travel in llms: Tracing data contamination in large language models. In: Proceedings of the International Conference on Learning Representations (ICLR 2024). Vienna, Austria. OpenReview (2024). https:\/\/arxiv.org\/abs\/2308.08493. Published as a conference paper at ICLR 2024"},{"key":"588_CR14","doi-asserted-by":"crossref","unstructured":"Gu, Q.: Llm-based code generation method for golang compiler testing. In: Proceedings of the 31st ACM Joint European Software Engineering Conference and Symposium on the Foundations of Software Engineering, pp. 2201\u20132203 (2023)","DOI":"10.1145\/3611643.3617850"},{"key":"588_CR15","unstructured":"Haldar, R., Hockenmaier, J.: Analyzing the performance of large language models on code summarization. In: Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024), pp. 995\u20131008 (2024)"},{"key":"588_CR16","doi-asserted-by":"publisher","unstructured":"He, J., Treude, C., Lo, D.: Llm-based multi-agent systems for software engineering: Literature review, vision and the road ahead. ACM Trans. Softw. Eng. Methodol. (2025). ISSN 1049-331X. https:\/\/doi.org\/10.1145\/3712003. Just Accepted","DOI":"10.1145\/3712003"},{"key":"588_CR17","unstructured":"Hong, S., Zhuge, M., Chen, J., Zheng, X., Cheng, Y., Wang, J., Zhang, C., Wang, Z., Yau, S.K.S., Lin, Z., Zhou, L., Ran, C., Xiao, L., Wu, C., Schmidhuber, J.: Metagpt: Meta programming for a multi-agent collaborative framework. In: Proceedings of the Twelfth International Conference on Learning Representations (ICLR) (2024). https:\/\/openreview.net\/forum?id=VtmBAGCN7o"},{"key":"588_CR18","doi-asserted-by":"crossref","unstructured":"Huang, D., Zhang, J.M., Bu, Q., Xie, X., Chen, J., Cui, H.: Bias testing and mitigation in llm-based code generation. ACM Trans. Softw. Eng. Methodology (2024)","DOI":"10.1145\/3724117"},{"key":"588_CR19","unstructured":"Kan\u00e9, H., Kocyigit, M.Y., Ajanoh, P., Abdalla, A., Coulibali, M.: Towards neural similarity evaluator. arXiv:1909.09268 (2019). https:\/\/api.semanticscholar.org\/CorpusID:213355380"},{"key":"588_CR20","unstructured":"Kasai, J., Sakaguchi, K., Le\u00a0Bras, R., Radev, D., Choi, Y., Smith, N.A.: A call for clarity in beam search: How it works and when it stops. In: Calzolari, N., Kan, M.-Y., Hoste, V., Lenci, A., Sakti, S., Xue, N. (eds.) Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024), pp. 77\u201390. Torino, Italia (2024). ELRA and ICCL. https:\/\/aclanthology.org\/2024.lrec-main.7\/"},{"key":"588_CR21","doi-asserted-by":"crossref","unstructured":"Keya, F., Jaradeh, M.Y., Auer, S.: Leveraging LLMs for Scientific Abstract Summarization: Unearthing the Essence of Research in a Single Sentence. Association for Computing Machinery, New York, NY, USA (2025). ISBN 9798400710933. https:\/\/doi-org.univaq.idm.oclc.org\/10.1145\/3677389.3702588","DOI":"10.1145\/3677389.3702588"},{"key":"588_CR22","doi-asserted-by":"publisher","unstructured":"Khan, R., Sharma, S., Upadhyay, D.: Extracting abstractive summaries through generative ai models. In: 2025 3rd International Conference on Disruptive Technologies (ICDT), pp. 671\u2013676 (2025). https:\/\/doi.org\/10.1109\/ICDT63985.2025.10986332","DOI":"10.1109\/ICDT63985.2025.10986332"},{"key":"588_CR23","unstructured":"Khanzadeh, S.: Agentmesh: A cooperative multi-agent generative ai framework for software development automation (2025). https:\/\/arxiv.org\/abs\/2507.19902v1"},{"key":"588_CR24","doi-asserted-by":"crossref","unstructured":"Khoee, A.G., Yu, Y., Feldt, R., Freimanis, A., Rhodin, P.A., Parthasarathy, D.: Gonogo: An efficient llm-based multi-agent system for streamlining automotive software release decision-making. arXiv:2408.09785 (2024). https:\/\/arxiv.org\/abs\/2408.09785","DOI":"10.1007\/978-3-031-80889-0_3"},{"key":"588_CR25","doi-asserted-by":"crossref","unstructured":"Kim, H., Kim, B.-H.: Nexussum: Hierarchical llm agents for long-form narrative summarization (2025). https:\/\/arxiv.org\/abs\/2505.24575","DOI":"10.18653\/v1\/2025.acl-long.500"},{"key":"588_CR26","unstructured":"Kong, M., Wang, Z., Shu, Y., Dai, Z.: Meta-prompt optimization for llm-based sequential decision making. arXiv:2502.00728 (2025). https:\/\/arxiv.org\/abs\/2502.00728"},{"key":"588_CR27","doi-asserted-by":"publisher","unstructured":"Krishna, K., Zhao, Y., Ren, J., Lakshminarayanan, B., Luo, J., Saleh, M., Liu, P.: Improving the robustness of summarization models by detecting and removing input noise. In: Bouamor, H., Pino, J., Bali, K. (eds.) Findings of the Association for Computational Linguistics: EMNLP 2023, pp. 1324\u20131336. Singapore. Association for Computational Linguistics (2023). https:\/\/doi.org\/10.18653\/v1\/2023.findings-emnlp.93.","DOI":"10.18653\/v1\/2023.findings-emnlp.93"},{"key":"588_CR28","doi-asserted-by":"crossref","unstructured":"Lee, J.Y., Kang, S., Yoon, J., Yoo, S.: The github recent bugs dataset for evaluating llm-based debugging applications. In: 2024 IEEE Conference on Software Testing, Verification and Validation (ICST), pp. 442\u2013444. IEEE (2024)","DOI":"10.1109\/ICST60714.2024.00049"},{"key":"588_CR29","unstructured":"Li, G., Hammoud, H.A.A.K., Itani, H., Khizbullin, D., Ghanem, B.: Camel: Communicative agents for \u201dmind\u201d exploration of large language model society. In: Proceedings of the 37th International Conference on Neural Information Processing Systems (NeurIPS). New Orleans, LA, USA. Curran Associates Inc. (2024). Article 2264, 18 pages"},{"key":"588_CR30","doi-asserted-by":"crossref","unstructured":"Li, M., Li, D., Liu, J., Cao, J., Tian, Y., Cheung, S.-C.: Enhancing differential testing with llms for testing deep learning libraries. ACM Trans. Softw. Eng. Methodology (2025a)","DOI":"10.1145\/3735637"},{"key":"588_CR31","doi-asserted-by":"publisher","unstructured":"Li, R., Zhang, Y., Zhou, X., Liang, P., Sun, W., Xuan, J., Jin, Z., Liu, Y.: Maad: Automate software architecture design through knowledge-driven multi-agent collaboration. ACM Trans. Softw. Eng. Methodology 0(0):0 (2025b). https:\/\/doi.org\/10.1145\/nnnnnnn.nnnnnnn.","DOI":"10.1145\/nnnnnnn.nnnnnnn"},{"key":"588_CR32","unstructured":"Lin, C.-Y.: ROUGE: A package for automatic evaluation of summaries. In: Text Summarization Branches Out, pp. 74\u201381. Barcelona, Spain. Association for Computational Linguistics (2004). https:\/\/aclanthology.org\/W04-1013"},{"key":"588_CR33","doi-asserted-by":"publisher","unstructured":"Liu, D., Demberg, V.: RST-LoRA: A discourse-aware low-rank adaptation for long document abstractive summarization. In: Duh, K., Gomez, H., Bethard, S. (eds.) Proceedings of the 2024 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies (Volume 1: Long Papers), pp. 2200\u20132220. Mexico City, Mexico. Association for Computational Linguistics (2024). https:\/\/doi.org\/10.18653\/v1\/2024.naacl-long.121.","DOI":"10.18653\/v1\/2024.naacl-long.121"},{"key":"588_CR34","doi-asserted-by":"publisher","unstructured":"Liu, Y., Liu, L., Liu, H., Wang, X., Yang, H.: Mining domain knowledge from app descriptions. J. Syst. Softw. 133, 126\u2013144 (2017). ISSN 0164-1212. https:\/\/doi.org\/10.1016\/j.jss.2017.08.024.","DOI":"10.1016\/j.jss.2017.08.024"},{"key":"588_CR35","doi-asserted-by":"publisher","unstructured":"Liu, Y., Noei, E., Lyons, K.: How readme files are structured in open source java projects. Inf. Softw. Technol. 148, 106924 (2022). ISSN 0950-5849. https:\/\/doi.org\/10.1016\/j.infsof.2022.106924.","DOI":"10.1016\/j.infsof.2022.106924"},{"key":"588_CR36","unstructured":"Lu, Z., Li, X., Cai, D., Yi, R., Liu, F., Zhang, X., Lane, N.D., Xu, M.: Small language models: Survey, measurements, and insights. arXiv:2409.15790 (2024)"},{"key":"588_CR37","unstructured":"Mei, A., Kabir, A., Bapat, R., Judge, J., Sun, T., Wang, W.Y.: Learning to prioritize: Precision-driven sentence filtering for long text summarization. In: Calzolari, N., B\u00e9chet, F., Blache, P., Choukri, K., Cieri, C., Declerck, T., Goggi, S., Isahara, H., Maegaard, B., Mariani, J., Mazo, H., Odijk, J., Piperidis, S. (eds.) Proceedings of the Thirteenth Language Resources and Evaluation Conference, pp. 313\u2013318. Marseille, France. European Language Resources Association (2022). https:\/\/aclanthology.org\/2022.lrec-1.33\/"},{"key":"588_CR38","doi-asserted-by":"crossref","unstructured":"Narayan, S., Cohen, S.B., Lapata, M.: Don\u2019t give me the details, just the summary! topic-aware convolutional neural networks for extreme summarization. In: Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing, pp. 1797\u20131807. Association for Computational Linguistics (2018)","DOI":"10.18653\/v1\/D18-1206"},{"key":"588_CR39","doi-asserted-by":"publisher","unstructured":"Ng, J.-P., Abrecht, V.: Better summarization evaluation with word embeddings for ROUGE. In: M\u00e0rquez, L., Callison-Burch, C., Su, J. (eds.) Proceedings of the 2015 Conference on Empirical Methods in Natural Language Processing, pp. 1925\u20131930. Lisbon, Portugal. Association for Computational Linguistics (2015). https:\/\/doi.org\/10.18653\/v1\/D15-1222.","DOI":"10.18653\/v1\/D15-1222"},{"key":"588_CR40","doi-asserted-by":"publisher","unstructured":"Nguyen, D.S.H., Truong, B.G., Nguyen, P.T., Di\u00a0Rocco, J., Di\u00a0Ruscio, D.: Teamwork makes the dream work: LLMs-Based Agents for GitHub README.MD Summarization. In: Proceedings of the 33rd ACM International Conference on the Foundations of Software Engineering. FSE Companion \u201925, pp. 621\u2013625. New York, NY, USA. Association for Computing Machinery (2025). ISBN 9798400712760. https:\/\/doi.org\/10.1145\/3696630.3728511","DOI":"10.1145\/3696630.3728511"},{"key":"588_CR41","doi-asserted-by":"publisher","unstructured":"Nguyen, P.T., Di Rocco, J., Di Sipio, C., Rubei, R., Di Ruscio, D., Di Penta, M.: GPTSniffer: A CodeBERT-based classifier to detect source code written by ChatGPT. J. Syst. Softw. 214, 112059 (2024). ISSN 0164-1212. https:\/\/doi.org\/10.1016\/j.jss.2024.112059.","DOI":"10.1016\/j.jss.2024.112059"},{"issue":"3","key":"588_CR42","doi-asserted-by":"publisher","first-page":"4","DOI":"10.1109\/MS.2023.3248401","volume":"40","author":"I Ozkaya","year":"2023","unstructured":"Ozkaya, I.: Application of large language models to software engineering tasks: Opportunities, risks, and implications. IEEE Softw. 40(3), 4\u20138 (2023). https:\/\/doi.org\/10.1109\/MS.2023.3248401","journal-title":"IEEE Softw."},{"key":"588_CR43","unstructured":"Pan, L., Wu, Y., Liu, Y., Sun, M., Gong, Y., Yang, Z., Jiang, D.: Mamm-refine: Faithful multi-agent summarization with automatic mistake mining and self-refinement. arXiv:2503.15272 (2024). https:\/\/arxiv.org\/abs\/2503.15272"},{"key":"588_CR44","doi-asserted-by":"publisher","unstructured":"Pham, M.-Q., Indurthi, S., Chollampatt, S., Turchi, M.: Select, prompt, filter: Distilling large language models for summarizing conversations. In: Bouamor, H., Pino, J., Bali, K. (eds.) Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, pp. 12257\u201312265. Singapore. Association for Computational Linguistics (2023). https:\/\/doi.org\/10.18653\/v1\/2023.emnlp-main.753.","DOI":"10.18653\/v1\/2023.emnlp-main.753"},{"key":"588_CR45","doi-asserted-by":"crossref","unstructured":"Rasheed, Z., Sami, A.M., Kemell, K.-K., Waseem, M., Saari, M., Syst\u00e4, K., Abrahamsson, P.: Codepori: Large-scale system for autonomous software development using multi-agent technology. Inf. Softw. Technol. (2024). https:\/\/arxiv.org\/abs\/2402.01411. arXiv:2402.01411","DOI":"10.2139\/ssrn.4979510"},{"key":"588_CR46","unstructured":"Shen, M., Shu, R., Pratik, A., Gung, J., Ge, Y., Sunkara, M., Zhang, Y.: Optimizing llm-based multi-agent system with textual feedback: A case study on software development. In: AI Agents: Capabilities and Safety Workshop @ Conference on Language Modeling (COLM) (2025). https:\/\/arxiv.org\/abs\/2505.16086"},{"key":"588_CR47","doi-asserted-by":"publisher","unstructured":"Shi, L. Mu, F., Chen, X., Wang, S., Wang, J., Yang, Y., Li, G., Xia, X., Wang, Q.: Are we building on the rock? on the importance of data preprocessing for code summarization. In: Proceedings of the 30th ACM Joint European Software Engineering Conference and Symposium on the Foundations of Software Engineering. ESEC\/FSE 2022, pp. 107\u2013119. New York, NY, USA. Association for Computing Machinery (2022). ISBN 9781450394130. https:\/\/doi.org\/10.1145\/3540250.3549145","DOI":"10.1145\/3540250.3549145"},{"key":"588_CR48","doi-asserted-by":"publisher","unstructured":"Silva, A.R.S., Priyadarshana, Y.H.P.P.: Ontology-based prompt tuning for news article summarization. Frontiers in Artificial Intelligence Volume 8 - 2025 (2025). ISSN 2624-8212. https:\/\/doi.org\/10.3389\/frai.2025.1520144.","DOI":"10.3389\/frai.2025.1520144"},{"key":"588_CR49","doi-asserted-by":"crossref","unstructured":"Sun, W., Miao, Y., Li, Y., Zhang, H., Fang, C., Liu, Y., Deng, G., Liu, Y., Chen, Z.: Source code summarization in the era of large language models. arXiv:2407.07959 (2024)","DOI":"10.1109\/ICSE55347.2025.00034"},{"key":"588_CR50","unstructured":"Takeshita, S., Ponzetto, S.P., Eckert, K.: IRSum: One model to rule summarization and retrieval. In: Arviv, O., Clinciu, M., Dhole, K., Dror, R., Gehrmann, S., Habba, E., Itzhak, I., Mille, S., Perlitz, Y., Santus, E., Sedoc, J., Shmueli\u00a0Scheuer, M., Stanovsky, G., Tafjord, O. (eds.) Proceedings of the Fourth Workshop on Generation, Evaluation and Metrics (GEM$$^{2}$$), pp. 262\u2013275. Vienna, Austria and virtual meeting. Association for Computational Linguistics (2025). ISBN 979-8-89176-261-9. https:\/\/aclanthology.org\/2025.gem-1.23\/"},{"key":"588_CR51","unstructured":"Tao, W., Zhou, Y., Wang, Y., Zhang, W., Zhang, H., Cheng, Y.: Magis: Llm-based multi-agent framework for github issue resolution. In: Proceedings of the 38th Conference on Neural Information Processing Systems (NeurIPS). Curran Associates, Inc. (2024)"},{"key":"588_CR52","doi-asserted-by":"crossref","unstructured":"Tian, R., Ye, Y., Qin, Y., Cong, X., Lin, Y., Pan, Y., Wu, Y., Haotian, H., Weichuan, L., Liu, Z., et\u00a0al.: Debugbench: Evaluating debugging capability of large language models. In: Findings of the Association for Computational Linguistics ACL 2024, pp. 4173\u20134198 (2024)","DOI":"10.18653\/v1\/2024.findings-acl.247"},{"key":"588_CR53","doi-asserted-by":"publisher","unstructured":"Vitale, A., Mastropaolo, A., Oliveto, R., Di\u00a0Penta, M., Scalabrino, S.: Optimizing Datasets for Code Summarization: Is Code-Comment Coherence Enough?. In: 2025 IEEE\/ACM 33rd International Conference on Program Comprehension (ICPC), pp. 237\u2013249. Los Alamitos, CA, USA. IEEE Computer Society (2025). https:\/\/doi.org\/10.1109\/ICPC66645.2025.00033. https:\/\/doi.ieeecomputersociety.org\/10.1109\/ICPC66645.2025.00033","DOI":"10.1109\/ICPC66645.2025.00033"},{"key":"588_CR54","unstructured":"Wang, H., Du, X., Yu, W., Chen, Q., Zhu, K., Chu, Z., Yan, L., Guan, Y.: Apollo\u2019s oracle: Retrieval-augmented reasoning in multi-agent debates. arXiv:2312.04854 (2023). https:\/\/arxiv.org\/abs\/2312.04854"},{"issue":"6","key":"588_CR55","doi-asserted-by":"publisher","first-page":"186345","DOI":"10.1007\/S11704-024-40231-1","volume":"18","author":"L Wang","year":"2024","unstructured":"Wang, L., Ma, C., Feng, X., Zhang, Z., Yang, H., Zhang, J., Chen, Z., Tang, J., Chen, X., Lin, Y., Zhao, W.X., Wei, Z., Wen, J.: A survey on large language model based autonomous agents. Frontiers Comput. Sci. 18(6), 186345 (2024a). https:\/\/doi.org\/10.1007\/S11704-024-40231-1","journal-title":"Frontiers Comput. Sci."},{"key":"588_CR56","doi-asserted-by":"publisher","unstructured":"Wang, L., Zhou, Y., Zhuang, H., Li, Q., Cui, D., Zhao, Y., Wang, L.: Unity is strength: Collaborative llm-based agents for code reviewer recommendation. In: Proceedings of the 39th IEEE\/ACM ASE. ASE \u201924, pp. 2235\u20132239. New York, NY, USA. ACM (2024b). ISBN 9798400712487. https:\/\/doi.org\/10.1145\/3691620.3695291","DOI":"10.1145\/3691620.3695291"},{"key":"588_CR57","unstructured":"White, J., Fu, Q., Hays, S., Sandborn, M., Olea, C., Gilbert, H., Elnashar, A., Spencer-Smith, J., Schmidt, D.C.: A prompt pattern catalog to enhance prompt engineering with chatgpt. In: Proceedings of the 30th Conference on Pattern Languages of Programs. PLoP \u201923, USA (2023). The Hillside Group. ISBN 9781941652190"},{"key":"588_CR58","unstructured":"Wu, Q., Bansal, G., Zhang, J., Wu, Y., Li, B., Zhu, E., Jiang, L., Zhang, X., Zhang, S., Liu, J., Awadallah, A.H., White, R.W., Burger, D., Wang, C.: Autogen: Enabling next-gen llm applications via multi-agent conversations. In: Proceedings of the First Conference on Language Modeling (2024). https:\/\/openreview.net\/forum?id=BAakY1hNKS"},{"key":"588_CR59","doi-asserted-by":"publisher","unstructured":"Xia, C.S., Deng, Y., Dunn, S., Zhang, L.: Agentless: Demystifying llm-based software engineering agents. CoRR (2024). https:\/\/doi.org\/10.48550\/ARXIV.2407.01489","DOI":"10.48550\/ARXIV.2407.01489"},{"key":"588_CR60","unstructured":"Yang, C., Wang, X., Lu, Y., Liu, H., Le, Q.V., Zhou, D., Chen, X.: Large language models as optimizers. In: Proceedings of the Twelfth International Conference on Learning Representations (ICLR). Vienna, Austria (2024). https:\/\/openreview.net\/forum?id=Bb4VGOWELI"},{"key":"588_CR61","doi-asserted-by":"publisher","unstructured":"Yao, Z., Schloss, B., Selvaraj, S.: Improving summarization with human edits. In: Bouamor, H., Pino, J., Bali, K. (eds.) Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, pp. 2604\u20132620. Singapore. Association for Computational Linguistics (2023). https:\/\/doi.org\/10.18653\/v1\/2023.emnlp-main.158. https:\/\/aclanthology.org\/2023.emnlp-main.158\/","DOI":"10.18653\/v1\/2023.emnlp-main.158"},{"key":"588_CR62","unstructured":"Zhang, J., Wang, Z., Zhu, H., Liu, J., Lin, Q., Cambria, E.: Mars: A multi-agent framework incorporating socratic guidance for automated prompt optimization (2025). https:\/\/arxiv.org\/abs\/2503.16874"},{"key":"588_CR63","unstructured":"Zhang, L., Ashley, K.D.: Mitigating manipulation and enhancing persuasion: A reflective multi-agent approach for legal argument generation. In: Proceedings of the Workshop on Legally Compliant Intelligent Chatbots at ICAIL 2025. Chicago, IL, USA (2025). https:\/\/arxiv.org\/abs\/2506.02992"},{"key":"588_CR64","doi-asserted-by":"publisher","unstructured":"Zhang, T., Irsan, I.C., Thung, F., Han, D., Lo, D., Jiang, L.: itiger: An automatic issue title generation tool. ESEC\/FSE 2022, pp. 1637\u20131641. New York, NY, USA. Association for Computing Machinery (2022). ISBN 9781450394130. https:\/\/doi.org\/10.1145\/3540250.3558934","DOI":"10.1145\/3540250.3558934"},{"key":"588_CR65","unstructured":"Zhang, Y., Sun, R., Chen, Y., Pfister, T., Zhang, R., Arik, S.O.: Chain of agents: Large language models collaborating on long-context tasks. arXiv:2406.02818 (2024). https:\/\/arxiv.org\/abs\/2406.02818. Preprint. Under review. Work done in part at Google Cloud AI Research"},{"key":"588_CR66","unstructured":"Zhou, H., Wan, X., Sun, R., Palangi, H., Iqbal, S., Vuli\u0107, I., Korhonen, A., Ar\u0131k, S.\u00d6.: Multi-agent design: Optimizing agents with better prompts and topologies. arXiv:2502.02533 (2025a). https:\/\/arxiv.org\/abs\/2502.02533. Preprint submitted to arXiv"},{"key":"588_CR67","doi-asserted-by":"crossref","unstructured":"Zhou, X., Huang, H., Liao, L.: Debate, reflect, and distill: Multi-agent feedback with tree-structured preference optimization for efficient language model enhancement. arXiv:2506.03541 (2025b). https:\/\/arxiv.org\/abs\/2506.03541","DOI":"10.18653\/v1\/2025.findings-acl.475"},{"key":"588_CR68","unstructured":"Zhou, Y., Muresanu, A.I., Han, Z., Paster, K., Pitis, S., Chan, H., Ba, J.: Large language models are human-level prompt engineers. In: Proceedings of the Eleventh International Conference on Learning Representations (ICLR). Kigali, Rwanda (2023). https:\/\/openreview.net\/forum?id=92gvk82DE-"},{"key":"588_CR69","unstructured":"Zhou, Z., Wu, F., Talaei, S., Zhao, H., Meixin, C., Xu, T., Saberi, A., Choi, Y.: When to trust context: Self-reflective debates for context reliability. arXiv:2506.06020 (2025c). https:\/\/arxiv.org\/abs\/2506.06020"}],"container-title":["Automated Software Engineering"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10515-025-00588-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10515-025-00588-4","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10515-025-00588-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,1,9]],"date-time":"2026-01-09T05:37:42Z","timestamp":1767937062000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10515-025-00588-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,1,9]]},"references-count":69,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2026,12]]}},"alternative-id":["588"],"URL":"https:\/\/doi.org\/10.1007\/s10515-025-00588-4","relation":{"has-preprint":[{"id-type":"doi","id":"10.21203\/rs.3.rs-7539426\/v1","asserted-by":"object"}]},"ISSN":["0928-8910","1573-7535"],"issn-type":[{"value":"0928-8910","type":"print"},{"value":"1573-7535","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,1,9]]},"assertion":[{"value":"4 September 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"11 December 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"9 January 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"This article does not contain any studies with human participants or animals performed by any of the authors.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical Approval"}},{"value":"All the authors declare that they have no conflict of interest. Furthermore, they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflicts of Interest"}},{"value":"The authors declare no competing interests.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing Interests"}}],"article-number":"43"}}