{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,13]],"date-time":"2026-02-13T21:29:17Z","timestamp":1771018157344,"version":"3.50.1"},"reference-count":77,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"2","license":[{"start":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T00:00:00Z","timestamp":1769904000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T00:00:00Z","timestamp":1769904000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T00:00:00Z","timestamp":1769904000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"Ministry of Education, Singapore under its Academic Research Fund Tier 2","award":["T2EP20222-0037"],"award-info":[{"award-number":["T2EP20222-0037"]}]},{"name":"Key R&#x0026;D Program of Zhejiang","award":["2025C01083"],"award-info":[{"award-number":["2025C01083"]}]},{"DOI":"10.13039\/100018735","name":"Ant Group","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100018735","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IIEEE Trans. Software Eng."],"published-print":{"date-parts":[[2026,2]]},"DOI":"10.1109\/tse.2025.3619112","type":"journal-article","created":{"date-parts":[[2025,10,9]],"date-time":"2025-10-09T17:53:23Z","timestamp":1760032403000},"page":"411-427","source":"Crossref","is-referenced-by-count":0,"title":["Efficient Function Orchestration for Large Language Models"],"prefix":"10.1109","volume":"52","author":[{"ORCID":"https:\/\/orcid.org\/0009-0003-6662-9020","authenticated-orcid":false,"given":"Xiaoxia","family":"Liu","sequence":"first","affiliation":[{"name":"Zhejiang University, Zhejiang, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5799-5876","authenticated-orcid":false,"given":"Peng","family":"Di","sequence":"additional","affiliation":[{"name":"Ant Group, Zhejiang, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9576-100X","authenticated-orcid":false,"given":"Cong","family":"Li","sequence":"additional","affiliation":[{"name":"Zhejiang University, Zhejiang, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3545-1392","authenticated-orcid":false,"given":"Jun","family":"Sun","sequence":"additional","affiliation":[{"name":"Singapore Management University, Singapore"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7113-7635","authenticated-orcid":false,"given":"Jingyi","family":"Wang","sequence":"additional","affiliation":[{"name":"Zhejiang University, Zhejiang, China"}]}],"member":"263","reference":[{"key":"ref1","article-title":"GPT-4 technical report","author":"Achiam","year":"2023"},{"key":"ref2","doi-asserted-by":"crossref","first-page":"320","DOI":"10.18653\/v1\/2022.acl-long.26","article-title":"GLM: General language model pretraining with autoregressive blank infilling","volume-title":"Proc. 60th Annu. Meeting Assoc. Comput. Linguistics (Volume 1: Long Papers)","author":"Du","year":"2022"},{"key":"ref3","article-title":"Llama 2: Open foundation and fine-tuned chat models","author":"Touvron","year":"2023"},{"key":"ref4","article-title":"AutoGPT","year":"2023"},{"key":"ref5","article-title":"SWE-agent: Agent-computer interfaces enable automated software engineering","volume-title":"Proc. 38th Int. Conf. Neural Inf. Process. Syst.","author":"Yang","year":"2024"},{"key":"ref6","article-title":"Agentless: Demystifying LLM-based software engineering agents","author":"Xia","year":"2024"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1038\/s41586-023-06924-6"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1038\/s41586-023-06747-5"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2024.3368208"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2024.3472476"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1038\/s42256-023-00691-9"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1038\/s44286-023-00002-4"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1038\/s41592-024-02305-7"},{"key":"ref14","article-title":"ReAct: Synergizing reasoning and acting in language models","author":"Yao","year":"2022"},{"key":"ref15","article-title":"Function calling and other API updates","year":"2023"},{"key":"ref16","article-title":"ChatGLM3","year":"2023"},{"key":"ref17","article-title":"Llama3","year":"2024"},{"key":"ref18","article-title":"LangChain","author":"Chase","year":"2022"},{"key":"ref19","article-title":"Glaive function calling","year":"2023"},{"key":"ref20","article-title":"Gorilla: Large language model connected with massive APIs","volume-title":"Proc. 38th Int. Conf. Neural Inf. Process. Syst.","author":"Patil","year":"2024"},{"key":"ref21","article-title":"ToolLLM: Facilitating large language models to master 16000+ real-world APIs","author":"Qin","year":"2023"},{"key":"ref22","first-page":"35549","article-title":"FlashAttention-2: Faster attention with better parallelism and work partitioning","volume-title":"Proc. Int. Conf. Learn. Representations (ICLR)","author":"Dao","year":"2024"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1145\/3600006.3613165"},{"key":"ref24","article-title":"Break the sequential dependency of LLM inference using lookahead decoding","volume-title":"Proc. 41st Int. Conf. Mach. Learn.","author":"Fu","year":"2024"},{"key":"ref25","article-title":"Efficiently programming large language models using SGLang","author":"Zheng","year":"2023"},{"key":"ref26","article-title":"New models and developer products announced at DevDay","year":"2023"},{"key":"ref27","article-title":"Pull request: Add parallel function calling","year":"2023"},{"key":"ref28","article-title":"Parallel function calling","year":"2024"},{"key":"ref29","article-title":"Introduction to function calling","year":"2024"},{"key":"ref30","article-title":"An LLM-tool compiler for fused parallel function calling","author":"Singh","year":"2024"},{"key":"ref31","article-title":"An LLM compiler for parallel function calling","volume-title":"Proc. 41st Int. Conf. Mach. Learn.","author":"Kim","year":"2024"},{"key":"ref32","article-title":"Function calling","year":"2024"},{"key":"ref33","article-title":"AIOS: LLM agent operating system","author":"Mei","year":"2024"},{"key":"ref34","first-page":"50208","article-title":"Executable code actions elicit better LLM agents","volume-title":"Proc. 41st Int. Conf. Mach. Learn.","volume":"235","author":"Wang","year":"2024"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1145\/3613905.3651029"},{"key":"ref36","article-title":"Demonstrating large language models on robots","author":"Zeng","year":"2023","journal-title":"Robot.: Sci. Syst. XIX"},{"key":"ref37","article-title":"DAG-plan: Generating directed acyclic dependency graphs for dual-arm cooperative planning","author":"Gao","year":"2024"},{"key":"ref38","volume-title":"Compilers: Principles, Techniques, and Tools","author":"Aho","year":"2006"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1145\/324133.324234"},{"key":"ref40","article-title":"Llama.cpp"},{"key":"ref41","article-title":"MLC-LLM"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1145\/3694715.3695964"},{"key":"ref43","article-title":"PowerInfer-2: Fast large language model inference on a smartphone","author":"Xue","year":"2024"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.acl-long.678"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1002\/asi.24750"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D18-1259"},{"key":"ref47","article-title":"Developing with Asyncio","year":"2024"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1145\/3650212.3680323"},{"key":"ref49","doi-asserted-by":"crossref","DOI":"10.1145\/3622781.3674171","article-title":"The mutators reloaded: Fuzzing compilers with large language model generated mutation operators","volume-title":"Proc. Int. Conf. Archit. Support Program. Lang. Operating Syst. (ASPLOS)","author":"Ou","year":"2024"},{"key":"ref50","article-title":"Beyond the imitation game: Quantifying and extrapolating the capabilities of language models","author":"Srivastava","year":"2022"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1145\/1465482.1465560"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2012.6248074"},{"key":"ref53","first-page":"649","article-title":"Character-level convolutional networks for text classification","volume-title":"Proc. 29th Int. Conf. Neural Inf. Process. Syst. - vol. 1","volume":"28","author":"Zhang","year":"2015"},{"key":"ref54","article-title":"Functionary","year":"2023"},{"key":"ref55","article-title":"The Berkeley function calling leaderboard (BFCL): From tool use to agentic evaluation of large language models","volume-title":"Proc. 42nd Int. Conf. Mach. Learn. (ICML)","author":"Patil","year":"2025"},{"key":"ref56","article-title":"GLM-4","year":"2024"},{"key":"ref57","article-title":"Prompting frameworks for large language models: A survey","author":"Liu","year":"2023"},{"key":"ref58","first-page":"24824","article-title":"Chain-of-thought prompting elicits reasoning in large language models","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"35","author":"Wei","year":"2022"},{"key":"ref59","article-title":"Tree of thoughts: Deliberate problem solving with large language models","volume-title":"Proc. 37th Int. Conf. Neural Inf. Process. Syst. (NeurIPS)","author":"Yao","year":"2023"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i16.29720"},{"key":"ref61","article-title":"Retrieval-augmented generation for knowledge-intensive NLP tasks","volume-title":"Proc. 34th Int. Conf. Neural Inf. Process. Syst. (NeurIPS)","author":"Lewis","year":"2020"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1145\/3591300"},{"key":"ref63","article-title":"Semantic-kernel","year":"2023"},{"key":"ref64","article-title":"SuperAGI","year":"2023"},{"key":"ref65","article-title":"NeMo-Guardrails","year":"2023"},{"key":"ref66","article-title":"Efficient large language models: A survey","author":"Wan","year":"2024","journal-title":"Trans. Mach. Learn. Res."},{"key":"ref67","article-title":"Efficient streaming language models with attention sinks","author":"Xiao","year":"2024"},{"key":"ref68","first-page":"13358","article-title":"LLMLingua: Compressing prompts for accelerated inference of large language models","volume-title":"Proc. Conf. Empirical Methods Nat. Lang. Process.","author":"Jiang","year":"2023"},{"key":"ref69","article-title":"Mamba: Linear-time sequence modeling with selective state spaces","volume-title":"Proc. 1st Conf. Lang. Model.","author":"Gu","year":"2024"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1137\/0117039"},{"key":"ref71","first-page":"833","article-title":"BWoS: Formally verified block-based work stealing for parallel processing","volume-title":"Proc. 17th USENIX Symp. Operating Syst. Des. Implementation (OSDI 23)","author":"Wang","year":"2023"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.1145\/378420.378792"},{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.1985.232189"},{"key":"ref74","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4615-5535-3"},{"key":"ref75","doi-asserted-by":"publisher","DOI":"10.1109\/SC.2008.5214359"},{"key":"ref76","first-page":"2","article-title":"Timegraph: GPU scheduling for real-time multi-tasking environments","volume-title":"Proc. USENIX Conf. USENIX Annu. Tech. Conf. (USENIXATC)","author":"Kato","year":"2011"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1109\/HPCC\/SmartCity\/DSS.2019.00137"}],"container-title":["IEEE Transactions on Software Engineering"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/32\/11395383\/11197584.pdf?arnumber=11197584","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,2,13]],"date-time":"2026-02-13T20:49:46Z","timestamp":1771015786000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11197584\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,2]]},"references-count":77,"journal-issue":{"issue":"2"},"URL":"https:\/\/doi.org\/10.1109\/tse.2025.3619112","relation":{},"ISSN":["0098-5589","1939-3520","2326-3881"],"issn-type":[{"value":"0098-5589","type":"print"},{"value":"1939-3520","type":"electronic"},{"value":"2326-3881","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,2]]}}}