{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,10]],"date-time":"2026-04-10T21:21:35Z","timestamp":1775856095281,"version":"3.50.1"},"reference-count":115,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"9","license":[{"start":{"date-parts":[[2024,9,1]],"date-time":"2024-09-01T00:00:00Z","timestamp":1725148800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2024,9,1]],"date-time":"2024-09-01T00:00:00Z","timestamp":1725148800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,9,1]],"date-time":"2024-09-01T00:00:00Z","timestamp":1725148800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62372232"],"award-info":[{"award-number":["62372232"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100012226","name":"Fundamental Research Funds for the Central Universities","doi-asserted-by":"publisher","award":["NG2023005"],"award-info":[{"award-number":["NG2023005"]}],"id":[{"id":"10.13039\/501100012226","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Collaborative Innovation Center of Novel Software Technology and Industrialization"},{"name":"Postgraduate Research & Practice Innovation Program of Jiangsu Province","award":["KYCX23_0396"],"award-info":[{"award-number":["KYCX23_0396"]}]},{"name":"Short-term Visiting Program of Nanjing University of Aeronautics and Astronautics for Ph.D. 
Students Abroad","award":["240501DF16"],"award-info":[{"award-number":["240501DF16"]}]},{"name":"State Key Laboratory of Novel Software Technology, Nanjing University","award":["KFKT2022A03"],"award-info":[{"award-number":["KFKT2022A03"]}]},{"name":"State Key Laboratory of Novel Software Technology, Nanjing University","award":["KFKT2023A04"],"award-info":[{"award-number":["KFKT2023A04"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Software Eng."],"published-print":{"date-parts":[[2024,9]]},"DOI":"10.1109\/tse.2024.3440503","type":"journal-article","created":{"date-parts":[[2024,8,12]],"date-time":"2024-08-12T17:30:02Z","timestamp":1723483802000},"page":"2437-2457","source":"Crossref","is-referenced-by-count":38,"title":["Chain-of-Thought in Neural Code Generation: From and for Lightweight Language Models"],"prefix":"10.1109","volume":"50","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-3374-6680","authenticated-orcid":false,"given":"Guang","family":"Yang","sequence":"first","affiliation":[{"name":"College of Computer Science and Technology, Nanjing University of Aeronautics and Astronautics, Nanjing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3723-7584","authenticated-orcid":false,"given":"Yu","family":"Zhou","sequence":"additional","affiliation":[{"name":"College of Computer Science and Technology, Nanjing University of Aeronautics and Astronautics, Nanjing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1180-3891","authenticated-orcid":false,"given":"Xiang","family":"Chen","sequence":"additional","affiliation":[{"name":"School of Information Science and Technology, Nantong University, Nantong, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-6271-746X","authenticated-orcid":false,"given":"Xiangyu","family":"Zhang","sequence":"additional","affiliation":[{"name":"College of Computer Science and Technology, Nanjing University of Aeronautics and Astronautics, Nanjing, 
China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5760-5188","authenticated-orcid":false,"given":"Terry Yue","family":"Zhuo","sequence":"additional","affiliation":[{"name":"Monash University, Melbourne, VIC, Australia"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5993-1665","authenticated-orcid":false,"given":"Taolue","family":"Chen","sequence":"additional","affiliation":[{"name":"School of Computing and Mathematical Sciences, Birkbeck, University of London, London, U.K."}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1145\/3368089.3417058"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1126\/science.abq1158"},{"key":"ref3","article-title":"AI-assisted coding: Experiments with GPT-4","author":"Poldrack","year":"2023"},{"key":"ref4","article-title":"Is your code generated by chatGPT really correct? Rigorous evaluation of large language models for code generation","author":"Liu","year":"2023"},{"key":"ref5","article-title":"Challenges and applications of large language models","author":"Kaddour","year":"2023"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1016\/j.metrad.2023.100022"},{"key":"ref7","article-title":"Specializing smaller language models towards multi-step reasoning","author":"Fu","year":"2023"},{"key":"ref8","article-title":"Improving chatGPT prompt for code generation","author":"Liu","year":"2023"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICSE48619.2023.00205"},{"key":"ref10","article-title":"A study on prompt design, advantages and limitations of chatGPT for deep learning program repair","author":"Cao","year":"2023"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-55642-5_4"},{"key":"ref12","first-page":"24824","article-title":"Chain-of-thought prompting elicits reasoning in large language models","volume-title":"Proc. Int. Conf. Neural Inf. Process. 
Syst.","volume":"35","author":"Wei","year":"2022"},{"key":"ref13","article-title":"Self-planning code generation with large language model","author":"Jiang","year":"2023"},{"key":"ref14","article-title":"Structured chain-of-thought prompting for code generation","author":"Li","year":"2023"},{"key":"ref15","article-title":"Large language models are state-of-the-art evaluators of code generation","author":"Zhuo","year":"2023"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.findings-acl.67"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.acl-long.294"},{"key":"ref18","first-page":"22199","article-title":"Large language models are zero-shot reasoners","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","volume":"35","author":"Kojima","year":"2022"},{"key":"ref19","article-title":"CodeGen: An open large language model for code with multi-turn program synthesis","volume-title":"Proc. 11th Int. Conf. Learn. Representations","author":"Nijkamp","year":"2022"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.nlposs-1.25"},{"key":"ref21","first-page":"12360","article-title":"Root mean square layer normalization","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"32","author":"Zhang","year":"2019"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.emnlp-main.298"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref24","article-title":"LoRA: Low-rank adaptation of large language models","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Hu","year":"2021"},{"key":"ref25","article-title":"Evaluating large language models trained on code","author":"Chen","year":"2021"},{"key":"ref26","article-title":"GLM-130B: An open bilingual pre-trained model","volume-title":"Proc. 11th Int. Conf. Learn. 
Representations","author":"Zeng","year":"2022"},{"key":"ref27","article-title":"Code Llama: Open foundation models for code","author":"Rozi\u00e8re","year":"2023"},{"key":"ref28","article-title":"Llama 2: Open foundation and fine-tuned chat models","author":"Touvron","year":"2023"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1145\/3505243"},{"key":"ref30","article-title":"RoFormer: Enhanced transformer with rotary position embedding","author":"Su","year":"2021"},{"key":"ref31","first-page":"16344","article-title":"FlashAttention: Fast and memory-efficient exact attention with IO-awareness","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"35","author":"Dao","year":"2022"},{"key":"ref32","article-title":"Large language models for software engineering: A systematic literature review","author":"Hou","year":"2023"},{"key":"ref33","article-title":"Textbooks are all you need","author":"Gunasekar","year":"2023"},{"key":"ref34","article-title":"Bootstrapping code-text pretrained language model to detect inconsistency between code and comment","author":"Dau","year":"2024"},{"key":"ref35","article-title":"A survey on large language model based autonomous agents","author":"Wang","year":"2023"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1163\/2214-8647_dnp_e204640"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.emnlp-main.243"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.acl-long.576"},{"key":"ref39","article-title":"AVATAR: A parallel corpus for Java-Python program translation","author":"Ahmad","year":"2021"},{"key":"ref40","article-title":"StarCoder: May the source be with you!","author":"Li","year":"2023"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.emnlp-main.68"},{"key":"ref42","article-title":"Unifying the perspectives of NLP and software engineering: A survey on language models for 
code","author":"Zhang","year":"2023"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1016\/j.jss.2022.111577"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1007\/s10664-023-10372-1"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2021.107858"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/SANER53432.2022.00052"},{"key":"ref47","doi-asserted-by":"crossref","DOI":"10.2139\/ssrn.4623115","article-title":"Assessing and improving syntactic adversarial robustness of pre-trained models for code translation","author":"Yang","year":"2023"},{"key":"ref48","first-page":"311","article-title":"BLEU: A method for automatic evaluation of machine translation","volume-title":"Proc. 40th Annu. Meeting Assoc. Comput. Linguistics","author":"Papineni","year":"2002"},{"key":"ref49","first-page":"65","article-title":"METEOR: An automatic metric for MT evaluation with improved correlation with human judgments","volume-title":"Proc. ACL Workshop Intrinsic Extrinsic Eval. Meas. Mach. Transl. Summarization","author":"Banerjee","year":"2005"},{"key":"ref50","first-page":"74","article-title":"ROUGE: A package for automatic evaluation of summaries","volume-title":"Text Summarization Branches Out: Proc. ACL-04 Workshop, Barcelona, Spain","author":"Lin","year":"2004"},{"key":"ref51","article-title":"InternLM: A multilingual language model with progressively enhanced capabilities","author":"Team","year":"2023"},{"key":"ref52","article-title":"Gemini: A family of highly capable multimodal models","author":"Team","year":"2023"},{"key":"ref53","article-title":"GPT-4 technical report","author":"Achiam","year":"2023"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.findings-emnlp.139"},{"key":"ref55","article-title":"GraphCodeBERT: Pre-training code representations with data flow","volume-title":"Proc. Int. Conf. Learn. 
Representations","author":"Guo","year":"2020"},{"key":"ref56","article-title":"CodeXGLUE: A machine learning benchmark dataset for code understanding and generation","volume-title":"Proc. 35th Conf. Neural Inf. Process. Syst. Datasets Benchmarks Track (Round 1)","author":"Lu","year":"2021"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.naacl-main.211"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.emnlp-main.685"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1145\/3540250.3549162"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1145\/3580305.3599790"},{"key":"ref61","first-page":"349","article-title":"Retrieve and refine: Exemplar-based neural comment generation","volume-title":"Proc. 35th IEEE\/ACM Int. Conf. Automated Softw. Eng. (ASE)","author":"Wei","year":"2020"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2023.3292399"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1109\/ICSE48619.2023.00179"},{"issue":"1","key":"ref64","first-page":"87","article-title":"On the interpretation of \u03c7\u00b2 from contingency tables, and the calculation of P","volume-title":"J. R. Statist. 
Soc.","volume":"85","author":"Fisher","year":"1922"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1037\/h0031619"},{"key":"ref66","article-title":"DeepSeek-coder: When the large language model meets programming\u2013The rise of code intelligence","author":"Guo","year":"2024"},{"key":"ref67","article-title":"WizardCoder: Empowering code large language models with Evol-Instruct","author":"Luo","year":"2023"},{"key":"ref68","article-title":"Improving code generation by training with natural language feedback","author":"Chen","year":"2023"},{"key":"ref69","article-title":"StepCoder: Improve code generation with reinforcement learning from compiler feedback","author":"Dou","year":"2024"},{"key":"ref70","first-page":"23826","article-title":"InterCode: Standardizing and benchmarking interactive coding with execution feedback","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"36","author":"Yang","year":"2024"},{"key":"ref71","article-title":"OpenCodeInterpreter: Integrating code generation with execution and refinement","author":"Zheng","year":"2024"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.findings-emnlp.22"},{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.1162\/tacl_a_00502"},{"key":"ref74","volume-title":"Text generation strategies","author":"Face","year":"2023"},{"key":"ref75","first-page":"21548","article-title":"A contrastive framework for neural text generation","volume-title":"Proc. Adv. Neural Inf. Process. 
Syst.","volume":"35","author":"Su","year":"2022"},{"key":"ref76","article-title":"PEFT: State-of-the-art parameter-efficient fine-tuning methods","author":"Mangrulkar","year":"2022"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.acl-long.353"},{"key":"ref78","doi-asserted-by":"publisher","DOI":"10.1016\/j.aiopen.2023.08.012"},{"key":"ref79","article-title":"Alpaca-LoRA: Instruct-tune LLaMA on consumer hardware","year":"2023"},{"key":"ref80","doi-asserted-by":"publisher","DOI":"10.1145\/3401026"},{"key":"ref81","doi-asserted-by":"publisher","DOI":"10.1109\/SANER53432.2022.00075"},{"key":"ref82","doi-asserted-by":"publisher","DOI":"10.1109\/ASE.2017.8115626"},{"key":"ref83","first-page":"3053","article-title":"Inducing tree-substitution grammars","volume":"11","author":"Cohn","year":"2010","journal-title":"J. Mach. Learn. Res."},{"key":"ref84","doi-asserted-by":"publisher","DOI":"10.1145\/2635868.2635901"},{"key":"ref85","doi-asserted-by":"publisher","DOI":"10.1145\/1836089.1836091"},{"key":"ref86","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.acl-long.411"},{"key":"ref87","doi-asserted-by":"publisher","DOI":"10.1145\/2491411.2491458"},{"key":"ref88","doi-asserted-by":"publisher","DOI":"10.1145\/2594291.2594321"},{"key":"ref89","first-page":"1601","article-title":"The recurrent temporal restricted Boltzmann machine","volume-title":"Proc. Adv. Neural Inf. Process. 
Syst.","volume":"21","author":"Sutskever","year":"2008"},{"key":"ref90","doi-asserted-by":"publisher","DOI":"10.1109\/FPT.2016.7929190"},{"key":"ref91","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33017055"},{"key":"ref92","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P16-1195"},{"key":"ref93","doi-asserted-by":"publisher","DOI":"10.1145\/3238147.3238206"},{"key":"ref94","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P16-1078"},{"key":"ref95","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P17-1041"},{"key":"ref96","doi-asserted-by":"publisher","DOI":"10.1109\/ICSE43902.2021.00041"},{"key":"ref97","doi-asserted-by":"publisher","DOI":"10.1109\/CONIT51480.2021.9498268"},{"key":"ref98","doi-asserted-by":"publisher","DOI":"10.1109\/ISSRE52982.2021.00042"},{"key":"ref99","article-title":"Training and evaluating a Jupyter Notebook data science assistant","author":"Chandel","year":"2022"},{"key":"ref100","article-title":"InCoder: A generative model for code infilling and synthesis","volume-title":"11th Int. Conf. Learn. Representations","author":"Fried","year":"2022"},{"key":"ref101","article-title":"CodeGen2: Lessons for training LLMs on programming and natural languages","author":"Nijkamp","year":"2023"},{"key":"ref102","article-title":"OctoPack: Instruction tuning code large language models","author":"Muennighoff","year":"2023"},{"key":"ref103","article-title":"Emergent abilities of large language models","volume-title":"Trans. Mach. Learn. Res.","author":"Wei","year":"2022"},{"key":"ref104","article-title":"Rethinking with retrieval: Faithful large language model inference","author":"He","year":"2022"},{"key":"ref105","article-title":"Self-consistency improves chain of thought reasoning in language models","volume-title":"Proc. 11th Int. Conf. Learn. Representations","author":"Wang","year":"2022"},{"key":"ref106","article-title":"Selection-inference: Exploiting large language models for interpretable logical reasoning","volume-title":"Proc. 
11th Int. Conf. Learn. Representations","author":"Creswell","year":"2022"},{"key":"ref107","article-title":"Least-to-most prompting enables complex reasoning in large language models","volume-title":"Proc. 11th Int. Conf. Learn. Representations","author":"Zhou","year":"2022"},{"key":"ref108","article-title":"Large language models are reasoning teachers","author":"Ho","year":"2022"},{"key":"ref109","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.acl-long.150"},{"key":"ref110","article-title":"Distilling multi-step reasoning capabilities of large language models into smaller models via semantic decompositions","author":"Shridhar","year":"2022"},{"key":"ref111","doi-asserted-by":"publisher","DOI":"10.1007\/s10462-020-09938-y"},{"key":"ref112","article-title":"Evaluating multi-agent coordination abilities in large language models","author":"Agashe","year":"2023"},{"key":"ref113","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i16.29710"},{"key":"ref114","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01750"},{"key":"ref115","article-title":"AgentCoder: Multi-agent-based code generation with iterative testing and optimisation","author":"Huang","year":"2023"}],"container-title":["IEEE Transactions on Software 
Engineering"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/32\/10683742\/10634302.pdf?arnumber=10634302","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,20]],"date-time":"2024-09-20T06:27:29Z","timestamp":1726813649000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10634302\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,9]]},"references-count":115,"journal-issue":{"issue":"9"},"URL":"https:\/\/doi.org\/10.1109\/tse.2024.3440503","relation":{},"ISSN":["0098-5589","1939-3520","2326-3881"],"issn-type":[{"value":"0098-5589","type":"print"},{"value":"1939-3520","type":"electronic"},{"value":"2326-3881","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,9]]}}}