{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,13]],"date-time":"2026-03-13T15:00:37Z","timestamp":1773414037923,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":52,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,7,10]],"date-time":"2024-07-10T00:00:00Z","timestamp":1720569600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,7,10]]},"DOI":"10.1145\/3663529.3663861","type":"proceedings-article","created":{"date-parts":[[2024,7,10]],"date-time":"2024-07-10T19:43:13Z","timestamp":1720640593000},"page":"417-428","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":16,"title":["X-Lifecycle Learning for Cloud Incident Management using LLMs"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0000-6713-9240","authenticated-orcid":false,"given":"Drishti","family":"Goel","sequence":"first","affiliation":[{"name":"Microsoft, Bangalore, India"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9089-994X","authenticated-orcid":false,"given":"Fiza","family":"Husain","sequence":"additional","affiliation":[{"name":"Microsoft, Bangalore, India"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-5705-2316","authenticated-orcid":false,"given":"Aditya","family":"Singh","sequence":"additional","affiliation":[{"name":"Microsoft, Bangalore, India"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7275-3296","authenticated-orcid":false,"given":"Supriyo","family":"Ghosh","sequence":"additional","affiliation":[{"name":"Microsoft, Bangalore, India"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6296-0395","authenticated-orcid":false,"given":"Anjaly","family":"Parayil","sequence":"additional","affiliation":[{"name":"Microsoft, Bangalore, India"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0102-8139","authenticated-orcid":false,"given":"Chetan","family":"Bansal","sequence":"additional","affiliation":[{"name":"Microsoft, Redmond, United States"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-1492-0476","authenticated-orcid":false,"given":"Xuchao","family":"Zhang","sequence":"additional","affiliation":[{"name":"Microsoft, Redmond, United States"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2019-213X","authenticated-orcid":false,"given":"Saravan","family":"Rajmohan","sequence":"additional","affiliation":[{"name":"Microsoft, Redmond, United States"}]}],"member":"320","published-online":{"date-parts":[[2024,7,10]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.comnet.2013.04.001"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1145\/3551349.3559555"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICSE48619.2023.00149"},{"key":"e_1_3_2_1_4_1","volume-title":"13th USENIX Symposium on Operating Systems Design and Implementation (OSDI 18)","author":"Alquraan Ahmed","year":"2018","unstructured":"Ahmed Alquraan, Hatem Takruri, Mohammed Alfatafta, and Samer Al-Kiswany. 2018. An analysis of $network-partitioning$ failures in cloud systems. In 13th USENIX Symposium on Operating Systems Design and Implementation (OSDI 18). 51\u201368."},{"key":"e_1_3_2_1_5_1","volume-title":"Proceedings of the AAAI Conference on Artificial Intelligence. 36","author":"Azad Amar Prakash","year":"2022","unstructured":"Amar Prakash Azad, Supriyo Ghosh, Ajay Gupta, Harshit Kumar, Prateeti Mohapatra, Lena Eckstein, Leonard Posner, and Robert Kern. 2022. Picking Pearl From Seabed: Extracting Artefacts from Noisy Issue Triaging Collaborative Conversations for Hybrid Cloud Services. In Proceedings of the AAAI Conference on Artificial Intelligence. 36, 12440\u201312446."},{"key":"e_1_3_2_1_6_1","unstructured":"Satanjeev Banerjee and Alon Lavie. 2005. METEOR: An Automatic Metric for MT Evaluation with Improved Correlation with Human Judgments. In Proceedings of the ACL Workshop on Intrinsic and Extrinsic Evaluation Measures for Machine Translation and\/or Summarization Jade Goldstein Alon Lavie Chin-Yew Lin and Clare Voss (Eds.). Association for Computational Linguistics Ann Arbor Michigan. 65\u201372."},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1145\/3377813.3381353"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1109\/ASE.2019.00042"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1145\/3324884.3416624"},{"key":"e_1_3_2_1_10_1","volume-title":"Jared Kaplan, Harri Edwards, Yuri Burda, Nicholas Joseph, and Greg Brockman.","author":"Chen Mark","year":"2021","unstructured":"Mark Chen, Jerry Tworek, Heewoo Jun, Qiming Yuan, Henrique Ponde de Oliveira Pinto, Jared Kaplan, Harri Edwards, Yuri Burda, Nicholas Joseph, and Greg Brockman. 2021. Evaluating large language models trained on code. arXiv preprint arXiv:2107.03374."},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"crossref","unstructured":"Yinfang Chen Huaibing Xie Minghua Ma Yu Kang Xin Gao Liu Shi Yunjie Cao Xuedong Gao Hao Fan Ming WEN Jun Zeng Supriyo Ghosh Xuchao Zhang Chaoyun Zhang Qingwei Lin Saravan Rajmohan and Dongmei Zhang. 2023. Empowering Practical Root Cause Analysis by Large Language Models for Cloud Incidents. arXiv preprint arXiv:2305.15778.","DOI":"10.1145\/3627703.3629553"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1145\/3368089.3409768"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1"},{"key":"e_1_3_2_1_14_1","volume-title":"Characterizing Service Level Objectives for Cloud Services: Motivation of Short-Term Cache Allocation Performance Modeling. Ph. D. Dissertation","author":"Ding Jianru","unstructured":"Jianru Ding. 2020. Characterizing Service Level Objectives for Cloud Services: Motivation of Short-Term Cache Allocation Performance Modeling. Ph. D. Dissertation. The Ohio State University."},{"key":"e_1_3_2_1_15_1","volume-title":"2019 IEEE International Conference on Autonomic Computing (ICAC). 200\u2013206","author":"Ding Jianru","year":"2019","unstructured":"Jianru Ding, Ruiqi Cao, Indrajeet Saravanan, Nathaniel Morris, and Christopher Stewart. 2019. Characterizing service level objectives for cloud services: Realities and myths. In 2019 IEEE International Conference on Autonomic Computing (ICAC). 200\u2013206."},{"key":"e_1_3_2_1_16_1","unstructured":"Zhiyu Fan Xiang Gao Abhik Roychoudhury and Shin Hwei Tan. 2022. Improving automatically generated code from Codex via Automated Program Repair. arXiv preprint arXiv:2205.10583."},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1145\/3540250.3549098"},{"key":"e_1_3_2_1_18_1","volume-title":"Proceedings of the 31st ACM Joint European Software Engineering Conference and Symposium on the Foundations of Software Engineering. 1891\u20131902","author":"Ganatra Vaibhav","year":"2023","unstructured":"Vaibhav Ganatra, Anjaly Parayil, Supriyo Ghosh, Yu Kang, Minghua Ma, Chetan Bansal, Suman Nath, and Jonathan Mace. 2023. Detection Is Better Than Cure: A Cloud Incidents Perspective. In Proceedings of the 31st ACM Joint European Software Engineering Conference and Symposium on the Foundations of Software Engineering. 1891\u20131902."},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1145\/3236024.3236030"},{"key":"e_1_3_2_1_20_1","volume-title":"Proceedings of The Web Conference (WWW).","author":"Ghosh Supriyo","year":"2024","unstructured":"Supriyo Ghosh, Karish Grover, Jimmy Wong, Chetan Bansal, Rakesh Namineni, Mohit Verma, and Saravan Rajmohan. 2024. Dependency Aware Incident Linking in Large Cloud Systems. In Proceedings of The Web Conference (WWW)."},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1145\/3542929.3563482"},{"key":"e_1_3_2_1_22_1","volume-title":"Gemini: A Family of Highly Capable Multimodal Models. arXiv preprint arXiv:2312.11805.","author":"Google Gemini Team","year":"2023","unstructured":"Gemini Team Google. 2023. Gemini: A Family of Highly Capable Multimodal Models. arXiv preprint arXiv:2312.11805."},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1145\/322033.322044"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1145\/3510003.3510203"},{"key":"e_1_3_2_1_25_1","volume-title":"Proceedings of the Sixth ACM Symposium on Cloud Computing. 315\u2013328","author":"Jayathilaka Hiranya","year":"2015","unstructured":"Hiranya Jayathilaka, Chandra Krintz, and Rich Wolski. 2015. Response time service level agreements for cloud-hosted web applications. In Proceedings of the Sixth ACM Symposium on Cloud Computing. 315\u2013328."},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/3368089.3417054"},{"key":"e_1_3_2_1_27_1","volume-title":"Xpert: Empowering Incident Management with Query Recommendations via Large Language Models. arXiv preprint arXiv:2312.11988.","author":"Jiang Yuxuan","year":"2023","unstructured":"Yuxuan Jiang, Chaoyun Zhang, Shilin He, Zhihao Yang, Minghua Ma, Si Qin, Yu Kang, Yingnong Dang, Saravan Rajmohan, and Qingwei Lin. 2023. Xpert: Empowering Incident Management with Query Recommendations via Large Language Models. arXiv preprint arXiv:2312.11988."},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1109\/TBDATA.2019.2921572"},{"key":"e_1_3_2_1_29_1","volume-title":"Proceedings of the AAAI Conference on Artificial Intelligence. 37","author":"Joshi Harshit","year":"2023","unstructured":"Harshit Joshi, Jos\u00e9 Cambronero Sanchez, Sumit Gulwani, Vu Le, Gust Verbruggen, and Ivan Radi\u010dek. 2023. Repair is nearly generation: Multilingual program repair with llms. In Proceedings of the AAAI Conference on Artificial Intelligence. 37, 5131\u20135140."},{"key":"e_1_3_2_1_30_1","volume-title":"Proceedings of the 1st Workshop on Evaluating NLG Evaluation. Association for Computational Linguistics, 28\u201337","author":"Kane Hassan","year":"2020","unstructured":"Hassan Kane, Muhammed Yusuf Kocyigit, Ali Abdalla, Pelkins Ajanoh, and Mohamed Coulibali. 2020. NUBIA: NeUral Based Interchangeability Assessor for Text Generation. In Proceedings of the 1st Workshop on Evaluating NLG Evaluation. Association for Computational Linguistics, 28\u201337."},{"key":"e_1_3_2_1_31_1","volume-title":"ROUGE: A Package for Automatic Evaluation of Summaries. In Text Summarization Branches Out","author":"Lin Chin-Yew","year":"2004","unstructured":"Chin-Yew Lin. 2004. ROUGE: A Package for Automatic Evaluation of Summaries. In Text Summarization Branches Out. Association for Computational Linguistics, 74\u201381."},{"key":"e_1_3_2_1_32_1","volume-title":"COLING 2004: Proceedings of the 20th International Conference on Computational Linguistics. COLING, 501\u2013507","author":"Lin Chin-Yew","year":"2004","unstructured":"Chin-Yew Lin and Franz Josef Och. 2004. ORANGE: a Method for Evaluating Automatic Evaluation Metrics for Machine Translation. In COLING 2004: Proceedings of the 20th International Conference on Computational Linguistics. COLING, 501\u2013507."},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.1145\/3317550.3321438"},{"key":"e_1_3_2_1_34_1","volume-title":"RoBERTa: A Robustly Optimized BERT Pretraining Approach. ArXiv, abs\/1907.11692","author":"Liu Yinhan","year":"2019","unstructured":"Yinhan Liu, Myle Ott, Naman Goyal, Jingfei Du, Mandar Joshi, Danqi Chen, Omer Levy, Mike Lewis, Luke Zettlemoyer, and Veselin Stoyanov. 2019. RoBERTa: A Robustly Optimized BERT Pretraining Approach. ArXiv, abs\/1907.11692 (2019), https:\/\/api.semanticscholar.org\/CorpusID:198953378"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1145\/2623330.2623374"},{"key":"e_1_3_2_1_36_1","volume-title":"Proceedings of the 44th International Conference on Software Engineering. 2279\u20132290","author":"Mastropaolo Antonio","year":"2022","unstructured":"Antonio Mastropaolo, Luca Pascarella, and Gabriele Bavota. 2022. Using deep learning to generate complete log statements. In Proceedings of the 44th International Conference on Software Engineering. 2279\u20132290."},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.1145\/3102980.3102983"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1145\/3317550.3321432"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.future.2013.02.011"},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.1145\/2783258.2788624"},{"key":"e_1_3_2_1_41_1","volume-title":"Codegen: An open large language model for code with multi-turn program synthesis. arXiv preprint arXiv:2203.13474.","author":"Nijkamp Erik","year":"2022","unstructured":"Erik Nijkamp, Bo Pang, Hiroaki Hayashi, Lifu Tu, Huan Wang, Yingbo Zhou, Silvio Savarese, and Caiming Xiong. 2022. Codegen: An open large language model for code with multi-turn program synthesis. arXiv preprint arXiv:2203.13474."},{"key":"e_1_3_2_1_42_1","unstructured":"OpenAI. 2023. ChatGPT (Feb 13 version) [Large language model]. https:\/\/chat.openai.com"},{"key":"e_1_3_2_1_44_1","unstructured":"Alec Radford Jeff Wu Rewon Child David Luan Dario Amodei and Ilya Sutskever. 2019. Language Models are Unsupervised Multitask Learners. https:\/\/api.semanticscholar.org\/CorpusID:160025533"},{"key":"e_1_3_2_1_45_1","volume-title":"Proceedings of the 46th IEEE\/ACM International Conference on Software Engineering.","author":"Srinivas Pooja","year":"2024","unstructured":"Pooja Srinivas, Fiza Husain, Anjaly Parayil, Ayush Choure, Chetan Bansal, and Saravan Rajmohan. 2024. Intelligent Monitoring Framework for Cloud Services: A Data-Driven Approach. In Proceedings of the 46th IEEE\/ACM International Conference on Software Engineering."},{"key":"e_1_3_2_1_46_1","volume-title":"Chellammal Surianarayanan, and Pethuru Raj Chelliah.","author":"Surianarayanan Chellammal","year":"2019","unstructured":"Chellammal Surianarayanan, Pethuru Raj Chelliah, Chellammal Surianarayanan, and Pethuru Raj Chelliah. 2019. Cloud Monitoring. Essentials of Cloud Computing: A Holistic Perspective, 241\u2013254."},{"key":"e_1_3_2_1_47_1","unstructured":"Junjie Wang Yuchao Huang Chunyang Chen Zhe Liu Song Wang and Qing Wang. 2023. Software testing with large language model: Survey landscape and vision. arXiv preprint arXiv:2307.07221."},{"key":"e_1_3_2_1_48_1","unstructured":"Sean Wolfe. 2018. Amazon\u2019s one hour of downtime on Prime Day may have cost it up to $100 million in lost sales. https:\/\/www.businessinsider.com\/amazon-prime-day-website-issues-cost-it-millions-in-lost-sales-2018-7"},{"key":"e_1_3_2_1_49_1","doi-asserted-by":"publisher","DOI":"10.1145\/3520312.3534862"},{"key":"e_1_3_2_1_50_1","volume-title":"11th USENIX Symposium on Operating Systems Design and Implementation (OSDI 14)","author":"Yuan Ding","year":"2014","unstructured":"Ding Yuan, Yu Luo, Xin Zhuang, Guilherme Renna Rodrigues, Xu Zhao, Yongle Zhang, Pranay U Jain, and Michael Stumm. 2014. Simple Testing Can Prevent Most Critical Failures: An Analysis of Production Failures in Distributed $Data-Intensive$ Systems. In 11th USENIX Symposium on Operating Systems Design and Implementation (OSDI 14). 249\u2013265."},{"key":"e_1_3_2_1_51_1","unstructured":"Tianyi Zhang Varsha Kishore Felix Wu Kilian Weinberger and Yoav Artzi. 2019. BERTScore: Evaluating Text Generation with BERT. arXiv preprint arXiv:1904.09675 04."},{"key":"e_1_3_2_1_52_1","doi-asserted-by":"crossref","unstructured":"Xuchao Zhang Supriyo Ghosh Chetan Bansal Rujia Wang Minghua Ma Yu Kang and Saravan Rajmohan. 2024. Automated Root Causing of Cloud Incidents using In-Context Learning with GPT-4. arXiv preprint arXiv:2401.13810.","DOI":"10.1145\/3663529.3663846"},{"key":"e_1_3_2_1_53_1","doi-asserted-by":"publisher","DOI":"10.1145\/3477132.3483577"}],"event":{"name":"FSE '24: 32nd ACM International Conference on the Foundations of Software Engineering","location":"Porto de Galinhas Brazil","acronym":"FSE '24","sponsor":["SIGSOFT ACM Special Interest Group on Software Engineering"]},"container-title":["Companion Proceedings of the 32nd ACM International Conference on the Foundations of Software Engineering"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3663529.3663861","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3663529.3663861","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T23:44:22Z","timestamp":1750290262000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3663529.3663861"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,7,10]]},"references-count":52,"alternative-id":["10.1145\/3663529.3663861","10.1145\/3663529"],"URL":"https:\/\/doi.org\/10.1145\/3663529.3663861","relation":{},"subject":[],"published":{"date-parts":[[2024,7,10]]},"assertion":[{"value":"2024-07-10","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}