{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,5]],"date-time":"2026-06-05T05:11:40Z","timestamp":1780636300858,"version":"3.54.1"},"publisher-location":"New York, NY, USA","reference-count":56,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,8,3]]},"DOI":"10.1145\/3711896.3737013","type":"proceedings-article","created":{"date-parts":[[2025,8,1]],"date-time":"2025-08-01T13:30:13Z","timestamp":1754055013000},"page":"1128-1138","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":3,"title":["Knowledge-Aligned Domain Shift Tuning for Efficient Adaptation in Large Language Models"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-0746-9624","authenticated-orcid":false,"given":"Noriaki","family":"Kawamae","sequence":"first","affiliation":[{"name":"NTT Comware, Tokyo, Japan"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2025,8,3]]},"reference":[{"key":"e_1_3_2_2_1_1","first-page":"7319","article-title":"Intrinsic Dimensionality Explains the Effectiveness of Language Model Fine-Tuning","author":"Aghajanyan Armen","year":"2021","unstructured":"Armen Aghajanyan, Sonal Gupta, and Luke Zettlemoyer. 2021. Intrinsic Dimensionality Explains the Effectiveness of Language Model Fine-Tuning. In ACL\/IJCNLPP. 7319-7328.","journal-title":"ACL\/IJCNLPP."},{"key":"e_1_3_2_2_2_1","unstructured":"AI@Meta. 2024. Llama 3 Model Card. (2024)."},{"key":"e_1_3_2_2_3_1","volume-title":"A Neural Probabilistic Language Model. J. Mach. Learn. Res. 3 (Mar","author":"Bengio Yoshua","year":"2003","unstructured":"Yoshua Bengio, R\u00e9jean Ducharme, Pascal Vincent, and Christian Janvin. 2003. A Neural Probabilistic Language Model. J. Mach. Learn. Res. 3 (Mar 2003), 1137-1155."},{"key":"e_1_3_2_2_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/1553374.1553380"},{"key":"e_1_3_2_2_5_1","doi-asserted-by":"publisher","DOI":"10.5555\/944919.944937"},{"key":"e_1_3_2_2_6_1","volume-title":"Jared Kaplan","author":"Brown Tom","year":"2020","unstructured":"Tom Brown, Benjamin Mann, Nick Ryder, Melanie Subbiah, and et al Jared Kaplan. 2020. Language Models are Few-Shot Learners. In NeurIPS."},{"key":"e_1_3_2_2_7_1","volume-title":"Buehler","author":"Buehler Eric L.","year":"2024","unstructured":"Eric L. Buehler and Markus J. Buehler. 2024. X-LoRA: Mixture of Low-Rank Adapter Experts, a Flexible Framework for Large Language Models with Applications in Protein Mechanics and Molecular Design. CoRR abs\/2402.07148 (2024)."},{"key":"e_1_3_2_2_8_1","volume-title":"AdaPrompt: Adaptive Model Training for Prompt-based NLP. CoRR abs\/2202.04824","author":"Chen Yulong","year":"2022","unstructured":"Yulong Chen, Yang Liu, Li Dong, Shuohang Wang, Chenguang Zhu, Michael Zeng, and Yue Zhang. 2022. AdaPrompt: Adaptive Model Training for Prompt-based NLP. CoRR abs\/2202.04824 (2022)."},{"key":"e_1_3_2_2_9_1","doi-asserted-by":"crossref","unstructured":"Tim Dettmers Artidoro Pagnoni Ari Holtzman and Luke Zettlemoyer. 2023. QLoRA: Efficient Finetuning of Quantized LLMs. In NeurIPS.","DOI":"10.52202\/075280-0441"},{"key":"e_1_3_2_2_10_1","volume-title":"Smith","author":"Dodge Jesse","year":"2020","unstructured":"Jesse Dodge, Gabriel Ilharco, Roy Schwartz, Ali Farhadi, Hannaneh Hajishirzi, and Noah A. Smith. 2020. Fine-Tuning Pretrained Language Models: Weight Initializations, Data Orders, and Early Stopping. CoRR abs\/2002.06305 (2020)."},{"key":"e_1_3_2_2_11_1","first-page":"13042","article-title":"Unified Language Model Pre- training for Natural Language Understanding and Generation","author":"Dong Li","year":"2019","unstructured":"Li Dong, Nan Yang, Wenhui Wang, Furu Wei, Xiaodong Liu, Yu Wang, Jianfeng Gao, Ming Zhou, and Hsiao-Wuen Hon. 2019. Unified Language Model Pre- training for Natural Language Understanding and Generation. In NeurIPS. 13042-13054.","journal-title":"NeurIPS."},{"key":"e_1_3_2_2_12_1","unstructured":"Alexey Dosovitskiy Lucas Beyer and etc. 2021. An Image is Worth 16x16 Words: Transformers for Image Recognition at Scale. In ICLR."},{"key":"e_1_3_2_2_13_1","article-title":"Switch Transformers: Scaling to Trillion Parameter Models with Simple and Efficient Sparsity","volume":"23","author":"Fedus William","year":"2022","unstructured":"William Fedus, Barret Zoph, and Noam Shazeer. 2022. Switch Transformers: Scaling to Trillion Parameter Models with Simple and Efficient Sparsity. J. Mach. Learn. Res. 23 (2022), 120:1-120:39.","journal-title":"J. Mach. Learn. Res."},{"key":"e_1_3_2_2_14_1","unstructured":"Jonathan Frankle and Michael Carbin. 2019. The Lottery Ticket Hypothesis: Finding Sparse Trainable Neural Networks. In ICLR."},{"key":"e_1_3_2_2_15_1","first-page":"8342","article-title":"Don't stop pretraining: adapt language models to domains and tasks","author":"Gururangan Suchin","year":"2020","unstructured":"Suchin Gururangan and et al. 2020. Don't stop pretraining: adapt language models to domains and tasks. In ACL. 8342-8360.","journal-title":"ACL."},{"key":"e_1_3_2_2_16_1","first-page":"770","article-title":"Deep Residual Learning for Image Recognition","author":"He Kaiming","year":"2016","unstructured":"Kaiming He, Xiangyu Zhang, Shaoqing Ren, and Jian Sun. 2016. Deep Residual Learning for Image Recognition. In CVPR. 770-778.","journal-title":"CVPR."},{"key":"e_1_3_2_2_17_1","unstructured":"Neil Houlsby Andrei Giurgiu Stanislaw Jastrzebski Bruna Morrone Quentin de Laroussilhe Andrea Gesmundo Mona Attariyan and Sylvain Gelly. 2019. Parameter-Efficient Transfer Learning for NLPParameter-Efficient Transfer Learning for NLP. 2790-2799."},{"key":"e_1_3_2_2_18_1","unstructured":"Edward J. Hu Yelong Shen Phillip Wallis Zeyuan Allen-Zhu Yuanzhi Li Shean Wang Lu Wang and Weizhu Chen. 2022. LoRA: Low-Rank Adaptation of Large Language Models. In ICLR. OpenReview.net."},{"key":"e_1_3_2_2_19_1","first-page":"2579","article-title":"UDALM: Unsupervised Domain Adaptation through Language Modeling","author":"Karouzos Constantinos","year":"2021","unstructured":"Constantinos Karouzos, Georgios Paraskevopoulos, and Alexandros Potamianos. 2021. UDALM: Unsupervised Domain Adaptation through Language Modeling. In ACL. 2579-2590.","journal-title":"ACL."},{"key":"e_1_3_2_2_20_1","first-page":"315","article-title":"Topic Chronicle Forest for Topic Discovery and Tracking","author":"Kawamae Noriaki","year":"2018","unstructured":"Noriaki Kawamae. 2018. Topic Chronicle Forest for Topic Discovery and Tracking. In WSDM. 315-323.","journal-title":"WSDM."},{"key":"e_1_3_2_2_21_1","first-page":"2900","article-title":"Topic Structure-Aware Neural Language Model: Unified language model that maintains word and topic ordering by their embedded representations","author":"Kawamae Noriaki","year":"2019","unstructured":"Noriaki Kawamae. 2019. Topic Structure-Aware Neural Language Model: Unified language model that maintains word and topic ordering by their embedded representations. In WWW. 2900-2906.","journal-title":"WWW."},{"key":"e_1_3_2_2_22_1","doi-asserted-by":"publisher","DOI":"10.1145\/3486622.3493968"},{"key":"e_1_3_2_2_23_1","first-page":"10177","article-title":"Adapting a Language Model While Preserving its General Knowledge","author":"Ke Zixuan","year":"2022","unstructured":"Zixuan Ke, Yijia Shao, Haowei Lin, Hu Xu, Lei Shu, and Bing Liu. 2022. Adapting a Language Model While Preserving its General Knowledge. In EMNLP. 10177-10188.","journal-title":"EMNLP."},{"key":"e_1_3_2_2_24_1","volume-title":"Jacob Mitchell Springer, and Aditi Raghunathann","author":"Kotha Suhas","year":"2024","unstructured":"Suhas Kotha, Jacob Mitchell Springer, and Aditi Raghunathann. 2024. Understanding Catastrophic Forgetting in Language Models via Implicit Inferences. In ICLR."},{"key":"e_1_3_2_2_25_1","doi-asserted-by":"publisher","DOI":"10.3115\/1626355.1626389"},{"key":"e_1_3_2_2_26_1","unstructured":"Dmitry Lepikhin HyoukJoong Lee Yuanzhong Xu Dehao Chen Orhan Firat Yanping Huang Maxim Krikun Noam Shazeer and Zhifeng Chen. 2021. GShard: Scaling Giant Models with Conditional Computation and Automatic Sharding. In ICLR. OpenReview.net."},{"key":"e_1_3_2_2_27_1","first-page":"3045","article-title":"The Power of Scale for Parameter-Efficient Prompt Tuning","author":"Lester Brian","year":"2021","unstructured":"Brian Lester, Rami Al-Rfou, and Noah Constant. 2021. The Power of Scale for Parameter-Efficient Prompt Tuning. In EMNLP. 3045-3059.","journal-title":"EMNLP."},{"key":"e_1_3_2_2_28_1","unstructured":"Chunyuan Li Heerad Farkhoor Rosanne Liu and Jason Yosinski. 2018. Measuring the Intrinsic Dimension of Objective Landscapes. In ICLR."},{"key":"e_1_3_2_2_29_1","first-page":"4582","article-title":"Prefix-Tuning","author":"Li Xiang Lisa","year":"2021","unstructured":"Xiang Lisa Li and Percy Liang. 2021. Prefix-Tuning: Optimizing Continuous Prompts for Generation. In ACL\/IJCNLP. 4582-4597.","journal-title":"Optimizing Continuous Prompts for Generation. In ACL\/IJCNLP."},{"key":"e_1_3_2_2_30_1","first-page":"25","article-title":"Rouge: a package for automatic evaluation of summaries","author":"Lin Chin-Yew","year":"2004","unstructured":"Chin-Yew Lin. 2004. Rouge: a package for automatic evaluation of summaries. In ACL-workshop. 25-26.","journal-title":"ACL-workshop."},{"key":"e_1_3_2_2_31_1","volume-title":"Speciality vs Generality: An Empirical Study on Catastrophic Forgetting in Fine-tuning Foundation Models. CoRR abs\/2309.06256","author":"Lin Yong","year":"2023","unstructured":"Yong Lin, Lu Tan, Hangyu Lin, Zeming Zheng, Renjie Pi, Jipeng Zhang, Shizhe Diao, Haoxiang Wang, Han Zhao, Yuan Yao, and Tong Zhang. 2023. Speciality vs Generality: An Empirical Study on Catastrophic Forgetting in Fine-tuning Foundation Models. CoRR abs\/2309.06256 (2023)."},{"key":"e_1_3_2_2_32_1","unstructured":"Haokun Liu Derek Tam Muqeeth Mohammed Jay Mohta Tenghao Huang Mohit Bansal and Colin Raffel. 2022. Few-Shot Parameter-Efficient Fine-Tuning is Better and Cheaper than In-Context Learning. In NeurIPS."},{"key":"e_1_3_2_2_33_1","unstructured":"Liyuan Liu Young Jin Kim Shuohang Wang Chen Liang Yelong Shen Hao Cheng Xiaodong Liu Masahiro Tanaka Xiaoxia Wu Wenxiang Hu Vishrav Chaudhary Zeqi Lin Chengruidong Zhang Jilong Xue Hany Awadalla Jianfeng Gao and Weizhu Chen. 2025. GRIN: GRadient-INformed MoE. CoRR abs\/2409.12136 (2025)."},{"key":"e_1_3_2_2_34_1","volume-title":"CoRR abs\/2103.10385","author":"Liu Xiao","year":"2021","unstructured":"Xiao Liu, Yanan Zheng, Zhengxiao Du, Ming Ding, Yujie Qian, Zhilin Yang, and Jie Tang. 2021. GPT Understands, Too. CoRR abs\/2103.10385 (2021)."},{"key":"e_1_3_2_2_35_1","volume-title":"PEFT: State-of-the-art Parameter-Efficient Fine-Tuning methods. https:\/\/github.com\/huggingface\/peft.","author":"Mangrulkar Sourab","year":"2022","unstructured":"Sourab Mangrulkar, Sylvain Gugger, Lysandre Debut, Younes Belkada, Sayak Paul, and Benjamin Bossan. 2022. PEFT: State-of-the-art Parameter-Efficient Fine-Tuning methods. https:\/\/github.com\/huggingface\/peft."},{"key":"e_1_3_2_2_36_1","volume-title":"Oyvind Tafjord, Nathan Lambert, Yuling Gu, Shane Arora, Akshita Bhagia, Dustin Schwenk, David Wadden, Alexander Wettig, Binyuan Hui, Tim Dettmers, Douwe Kiela, Ali Farhadi, and et al.","author":"Muennighoff Niklas","year":"2025","unstructured":"Niklas Muennighoff, Luca Soldaini, Dirk Groeneveld, Kyle Lo, Jacob Morrison, Sewon Min, Weijia Shi, Evan Pete Walsh, Oyvind Tafjord, Nathan Lambert, Yuling Gu, Shane Arora, Akshita Bhagia, Dustin Schwenk, David Wadden, Alexander Wettig, Binyuan Hui, Tim Dettmers, Douwe Kiela, Ali Farhadi, and et al. 2025. OLMoE: Open Mixture-of-Experts Language Models. In ICLR. OpenReview.net."},{"key":"e_1_3_2_2_37_1","first-page":"311","article-title":"Bleu: a Method for Automatic Evaluation of Machine Translation","author":"Papineni Kishore","year":"2002","unstructured":"Kishore Papineni, Salim Roukos, Todd Ward, and Wei-Jing Zhu. 2002. Bleu: a Method for Automatic Evaluation of Machine Translation. In ACL. 311-318.","journal-title":"ACL."},{"key":"e_1_3_2_2_38_1","first-page":"186","article-title":"A Call for Clarity in Reporting BLEU Scores","author":"Post Matt","year":"2018","unstructured":"Matt Post. 2018. A Call for Clarity in Reporting BLEU Scores. In WMT. 186-191.","journal-title":"WMT."},{"key":"e_1_3_2_2_39_1","unstructured":"Vinay Venkatesh Ramasesh Ethan Dyer and Maithra Raghu. 2021. Anatomy of Catastrophic Forgetting: Hidden Representations and Task Semantics. In ICLR."},{"key":"e_1_3_2_2_40_1","unstructured":"Victor Sanh Albert Webson Colin Raffel Stephen Bach Lintang Sutawika Zaid Alyafeai Antoine Chaffin Arnaud Stiegler Arun Raja Manan Dey M Saiful Bari Canwen Xu Urmish Thakker Shanya Sharma Sharma Eliza Szczechla Taewoon Kim Gunjan Chhablani Nihal Nayak Debajyoti Datta Jonathan Chang Mike Tian-Jian Jiang Han Wang Matteo Manica Sheng Shen Zheng Xin Yong Harshit Pandey Rachel Bawden Thomas Wang Trishala Neeraj Jos Rozen Abheesht Sharma Andrea Santilli Thibault Fevry Jason Alan Fries Ryan Teehan Teven Le Scao Stella Biderman Leo Gao Thomas Wolf and Alexander M Rush. 2022. Multitask Prompted Training Enables Zero-Shot Task Generalization. In ICLR."},{"key":"e_1_3_2_2_41_1","unstructured":"Teven Le Scao Angela Fan Christopher Akiki Ellie Pavlick Suzana Ilic Daniel Hesslow Roman Castagn\u00e9 Alexandra Sasha Luccioni Fran\u00e7ois Yvon Matthias Gall\u00e9 Jonathan Tow Alexander M. Rush Stella Biderman Albert Webson Pawan Sasanka Ammanamanchi Thomas Wang Beno\u00eet Sagot Niklas Muennighoff Albert Villanova del Moral Olatunji Ruwase Rachel Bawden Stas Bekman Angelina McMillan-Major Iz Beltagy Huu Nguyen Lucile Saulnier Samson Tan Pedro Ortiz Suarez Victor Sanh Hugo Lauren\u00e7on Yacine Jernite Julien Launay Margaret Mitchell Colin Raffel Aaron Gokaslan Adi Simhi Aitor Soroa Alham Fikri Aji Amit Alfassy Anna Rogers Ariel Kreisberg Nitzav Canwen Xu Chenghao Mou Chris Emezue Christopher Klamm Colin Leong Daniel van Strien David Ifeoluwa Adelani and et al. 2022. BLOOM: A 176B-Parameter Open-Access Multilingual Language Model. CoRR abs\/2211.05100 (2022)."},{"key":"e_1_3_2_2_42_1","unstructured":"Noam Shazeer Azalia Mirhoseini Krzysztof Maziarz Andy Davis Quoc V. Le Geoffrey E. Hinton and Jeff Dean. 2017. Outrageously Large Neural Networks: The Sparsely-Gated Mixture-of-Experts Layer. In ICLR."},{"key":"e_1_3_2_2_43_1","volume-title":"Hashimoto","author":"Taori Rohan","year":"2023","unstructured":"Rohan Taori, Ishaan Gulrajani, Tianyi Zhang, Yann Dubois, Xuechen Li, Carlos Guestrin, Percy Liang, and Tatsunori B. Hashimoto. 2023. Alpaca: A Strong, Replicable Instruction-Following Model. Stanford Center for Research on Foundation Models (CRFM) blog. https:\/\/crfm.stanford.edu\/2023\/03\/13\/alpaca.html"},{"key":"e_1_3_2_2_44_1","volume-title":"LLaMA: Open and Efficient Foundation Language Models. CoRR abs\/2302.13971","author":"Touvron Hugo","year":"2023","unstructured":"Hugo Touvron, Thibaut Lavril, Gautier Izacard, Xavier Martinet, Marie-Anne Lachaux, Timoth\u00e9e Lacroix, Baptiste Rozi\u00e8re, Naman Goyal, Eric Hambro, Faisal Azhar, Aur\u00e9lien Rodriguez, Armand Joulin, Edouard Grave, and Guillaume Lample. 2023. LLaMA: Open and Efficient Foundation Language Models. CoRR abs\/2302.13971 (2023)."},{"key":"e_1_3_2_2_45_1","first-page":"5998","article-title":"Attention Is All You Need","author":"Vaswani Ashish","year":"2017","unstructured":"Ashish Vaswani, Noam Shazeer, Niki Parmar, and etc. 2017. Attention Is All You Need. In NIPS. 5998-6008.","journal-title":"NIPS."},{"key":"e_1_3_2_2_46_1","first-page":"5744","article-title":"AdaMix","author":"Wang Yaqing","year":"2022","unstructured":"Yaqing Wang, Sahaj Agarwal, Subhabrata Mukherjee, Xiaodong Liu, Jing Gao, Ahmed Hassan Awadallah, and Jianfeng Gao. 2022. AdaMix: Mixture-of-Adaptations for Parameter-efficient Model Tuning. In EMNLP. 5744-5760.","journal-title":"Mixture-of-Adaptations for Parameter-efficient Model Tuning. In EMNLP."},{"key":"e_1_3_2_2_47_1","first-page":"485","article-title":"Friendly Topic Assistant for Transformer Based Abstractive Summarization","author":"Wang Zhengjue","year":"2020","unstructured":"Zhengjue Wang, Zhibin Duan, Hao Zhang, Chaojie Wang, and etc. 2020. Friendly Topic Assistant for Transformer Based Abstractive Summarization. In EMNLP. 485-497.","journal-title":"EMNLP."},{"key":"e_1_3_2_2_48_1","volume-title":"Brian Lester, Nan Du, Andrew M. Dai, and Quoc V Le.","author":"Wei Jason","year":"2023","unstructured":"Jason Wei, Maarten Bosma, Vincent Zhao, Kelvin Guu, Adams Wei Yu, Brian Lester, Nan Du, Andrew M. Dai, and Quoc V Le. 2023. Finetuned Language Models are Zero-Shot Learners. In ICLR. OpenReview.net."},{"key":"e_1_3_2_2_49_1","volume-title":"Routing Experts: Learning to Route Dynamic Experts in Existing Multi-modal Large Language Models. In ICLR.","author":"Wu Qiong","year":"2025","unstructured":"Qiong Wu, Zhaoxi Ke, Yiyi Zhou, Xiaoshuai Sun, and Rongrong Ji. 2025. Routing Experts: Learning to Route Dynamic Experts in Existing Multi-modal Large Language Models. In ICLR."},{"key":"e_1_3_2_2_50_1","volume-title":"ReFT: Representation Finetuning for Language Models. CoRR abs\/2404.03592","author":"Wu Zhengxuan","year":"2024","unstructured":"Zhengxuan Wu, Aryaman Arora, Zheng Wang, Atticus Geiger, Dan Jurafsky, Christopher D. Manning, and Christopher Potts. 2024. ReFT: Representation Finetuning for Language Models. CoRR abs\/2404.03592 (2024)."},{"key":"e_1_3_2_2_51_1","volume-title":"Xiaohui Tao, and Fu Lee Wang.","author":"Xu Lingling","year":"2023","unstructured":"Lingling Xu, Haoran Xie, Si-Zhao Joe Qin, Xiaohui Tao, and Fu Lee Wang. 2023. Parameter-Efficient Fine-Tuning Methods for Pretrained Language Models:A Critical Review and Assessment. CoRR abs\/2312.12148 (2023)."},{"key":"e_1_3_2_2_52_1","unstructured":"Xinyue Xu Yi Qin Lu Mi Hao Wang and Xiaomeng Li. 2024. Energy-Based Concept Bottleneck Models: Unifying Prediction Concept Intervention and Probabilistic Interpretations. In ICLR."},{"key":"e_1_3_2_2_53_1","doi-asserted-by":"crossref","unstructured":"Elad Ben Zaken Yoav Goldberg and Shauli Ravfogel. 2022. BitFit: Simple Parameter-efficient Fine-tuning for Transformer-based Masked Language-models. In ACL Volume 2: Short Papers. ACL.","DOI":"10.18653\/v1\/2022.acl-short.1"},{"key":"e_1_3_2_2_54_1","unstructured":"Ningyu Zhang Luoqiu Li Xiang Chen Shumin Deng Zhen Bi Chuanqi Tan Fei Huang and Huajun Chen. 2022. Differentiable Prompt Makes Pre-trained Language Models Better Few-shot Learners. In ICLR. OpenReview.net."},{"key":"e_1_3_2_2_55_1","volume-title":"Todor Mihaylov, Myle Ott, Sam Shleifer, Kurt Shuster, Daniel Simig, Punit Singh Koura, Anjali Sridhar, Tianlu Wang, and Luke Zettlemoyer.","author":"Zhang Susan","year":"2022","unstructured":"Susan Zhang, Stephen Roller, Naman Goyal, Mikel Artetxe, Moya Chen, Shuohui Chen, Christopher Dewan, Mona Diab, Xian Li, Xi Victoria Lin, Todor Mihaylov, Myle Ott, Sam Shleifer, Kurt Shuster, Daniel Simig, Punit Singh Koura, Anjali Sridhar, Tianlu Wang, and Luke Zettlemoyer. 2022. OPT: Open Pre-trained Transformer Language Models. CoRR abs\/2205.01068 (2022)."},{"key":"e_1_3_2_2_56_1","unstructured":"Tianyi Zhang Varsha Kishore Felix Wu Kilian Q. Weinberger and Yoav Artzi. [n.d.]. BERTScore: Evaluating Text Generation with BERT BOOKTITLE =."}],"event":{"name":"KDD '25: The 31st ACM SIGKDD Conference on Knowledge Discovery and Data Mining","location":"Toronto ON Canada","acronym":"KDD '25","sponsor":["SIGKDD ACM Special Interest Group on Knowledge Discovery in Data","SIGMOD ACM Special Interest Group on Management of Data"]},"container-title":["Proceedings of the 31st ACM SIGKDD Conference on Knowledge Discovery and Data Mining V.2"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3711896.3737013","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,4,30]],"date-time":"2026-04-30T18:16:31Z","timestamp":1777572991000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3711896.3737013"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,8,3]]},"references-count":56,"alternative-id":["10.1145\/3711896.3737013","10.1145\/3711896"],"URL":"https:\/\/doi.org\/10.1145\/3711896.3737013","relation":{},"subject":[],"published":{"date-parts":[[2025,8,3]]},"assertion":[{"value":"2025-08-03","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}